From eb0850bca61f96cc9c5d2ab6b170b5eaec256c0d Mon Sep 17 00:00:00 2001 From: Jinx Date: Fri, 10 Apr 2026 06:37:43 +0000 Subject: [PATCH] Fix: correct source dataset tag names for tool_call/tool_response --- __pycache__/prepare_data.cpython-312.pyc | Bin 0 -> 7935 bytes prepare_data.py | 10 +++++----- 2 files changed, 5 insertions(+), 5 deletions(-) create mode 100644 __pycache__/prepare_data.cpython-312.pyc diff --git a/__pycache__/prepare_data.cpython-312.pyc b/__pycache__/prepare_data.cpython-312.pyc new file mode 100644 index 0000000000000000000000000000000000000000..33a28f5e6ec23c886cc5da61b987a455be2ea0fd GIT binary patch literal 7935 zcmeHMZEPDydY&bhUrSP?BvK!iY_C2nnYJlKmeY%6MUJcw$6u6VDLzMy!_eH7M1|z) zW|x-5P(9|5_Gs9JWi+Vhy9Abz0FhxG;2#C*0tM>+XnMu<2WiS@X5#`X>H_C~vSr|| z1`70@C3h+7q&5W#v_Cq6W@l&KdFP$kd7t-#zp~pI1mzb$%ZL8G3ZZ`?FKVHSjkS6T zp?SoiQN&T4E=-M5%2PM0gQq^MkIM6dr~;l%Z`PjyjO}5qBe%<2QrbD#4d(qJKES# zRN}EH@!@a)1I1*ZUE?l#BeAd)l43XtwENpwpAZwz@FE|;!HM>_c^u(I?_ew%ltMz( z+gFgsd$xmNjtJ5O8xwhUcmm`-dU}M&6$wb}?lCMx+AjveG2X*Yhkz;+gefa4fAbZ*km24r0;3x7t?Sc0=qnwJ; zA={NP%!^Y(ROI7jg(2;|vOA$o_KQ*gONpL%`T9;i%0X9ku}ht((YiMdDD*)c$e|W9 zH1zPlmV|m9jiXszg2JN~Bo#FQp#&vqGwu{y*ew}U7L!J`ReB~URcoSDf|}JQ^w`Vk zCaon3wZ-W_MG1XBQtzocZ!Zd4$8aPtxNS)A4maF5X zCudF=ILqfcl{bYFs2|Ny=PMAJH71Ocl_grW#W7p-TREG03hHy#v<0nwi~h1rc$gC= z&aCJyb=3!L$3=wQTkOY~Fu%H=tK%@E9A=Cr%#&_)52dFBh*>D5)6}H5BrKcGsnO=g;i2HF1(WUnMUhgrYcLjHPn4QYqkdPSDa_ROl3Qlr{h zH)r#k;@l|R9Cg)ABWah)fnaPxx5<5F5{yXAPzl{IYC@7~kh6|0tyk3MK*GFU+uS$HvErp&SeZc`zDHO-<|w zz`V#XgkvNyQ!qdRm?N;F5doGMD_S>^e7(XF1+yhh@WjAj_D3-u&$KBVh)h#hxESJK zJ;k`G(^)Yz4wehfUQ`A`QMQ{H39+YJu^wU%d+yXp#q@PCOmT>bM;UdPVFp1YJ`kMH zL{fy^$6}t?XE+P;DOusdBp;MEEKUxD4MaIOwDDMkk4l;l;uIeY1qwE|i;4FzAAj6P zs2jW3ZdGFC+VHfpoUD7=VXvZS}LWY6p@6Cd~=`7*LmoB@XDF)?@81=W97!`_8C;sK}>4SSC08sm!1 zp10akXD=U2TOU}PUKo(2DqVileZ!reS!~SJdY8@KXL=wk>fN4wl&4Z=LSiUNlq|^0 zdQrmI0Ze5Bai&DsaeR2l*Utw9jvv5SzyK~nD2f{hiB;X-fUjRR2BrW~I85MOHUW-= zK_6uk?0)Fp*XCR1#j3j%Irc!#@j47SUGwJa=5+N!^Vhp? z?Or^1_d>4mV9wcdR!GFm>TiTSZf9uz_-qi-OyBE#KUGq#)hw|DN2Dt5Oh;|#3r=Bs$ zRtq~{u~sIBe)j^R>>hkm|4laq zbr3qWLg0l!#o7n(ndjGe=$z(lQ%KUlgh0p=t%Arb@$D(%_nwadAnCw6(>!=>1@N}V zkv2oW1&vYlqi5-a9(*>BWKuaKXi4*TR6bajprbVj8e#^`|DV)+dUYnm8MMkb3Sc>F zkO(FyC819kRBpsyhc$x$o11z1;E9LUoyOH^@ZB`8h%-x?r(cRtAgZu@p;y<2*nk>F z9>y2ne-hA$So!Z4*s^VHZSj`xM=KkYSQ{KEgE$oqNtj?NbP_|3{{Y%A4J_;JVPDp; zVjwaVE*g7q9fYuAt;O4nY?#8Z8YbS1f`Awd4Z;Km6g0(7(jw4+Ni-_!!+i9%N!9_t znu<(iJr<^wwQ(;YQDRjQ!bdDyig?3wBKf#QI4WRKl@jx65xpAy;!{BQA^eLZ3P_^I zv?aszEYpV{Tiltdp8Mm=7GLs6zRZ~fJuH8Y%!UIgeZHpdrs;-h!2xJcb0B5UJ1gf+ z*G*|t&dH_>-#Y3+*&lCjT{J9-%iBAz5Bx*yubcm7&tL7i|L$_viOlE+Da&J5`(69J znVjob$|74`d0XW*-(_F=_@X6KxBsE76QIg);6(*8FsXshn&!s;Y~S3D%+4QVm^YT` zgL!L3(zgcUqW{-4ati-Dn%1dm+V@NgDXP}`J&7?%yWqp5B3h>0bVbMT5%Stcs(w-( zg=(wIKB1(j{9{4wvY!U(ACVdBF8kqS`Yq+MAHF}mY#I7LdD*cKgns3+TcAS^|7*X7 z8j_~~zF{;A!Qy6qDcLP4#G~ERfaoMG9i*5a!WjyI)lKOQC4&Jg8<$LX2%xDmG=ov- zBef=hPO_`LV5qbdh1v&{Mc^mtr%jE8nKLh0RKr3M0|_ao&5}WqmR?X-S9!y}HlIPF z38no042d}FO5qquOQMv_-_Ow(>rzz`2{x26sii*D9)u)TZI>ikH-mV_8%k*%kX<)P zjK+onF$yRIb|h$S3yN)UQc|lrjk8MR4k=}`{Ya47DU>+49IBk^xkJ*9tYZM4#sm$C zIs`4#x-+t^%zPI^_U(o(v7sbvT*XqQ z%8zrA1iyL)kXZ53$O1oDkUy0MoVd~raVMBp@59v~xHP5lsuHgmNIZ2w5^Y*Xq4z-J zfcvguVyW7PVcRHf^Lhm(!|mllIBsYsiE9!aOEXgtI6=q~fINNN?)63jm%K$UAzpVf z6bX^+xdZ{e>W}Px?M=vOdpvr41{mXEsAQUCQAU8DiTt<#*#X(iUxJ9pFMJetF(b-+ z9GF&lbg@r~hQ>`J<+~q<`>CZ{NtVA)ic>{FrQ*#v%9}h4{XT2j{WlQH8Z4 z8pOhiaDLKdg%6-Hw7_XWm>GjzSV>b|$gX&r+AE{@n|_jsk&A6|2V{B*e$SApF_{uY za?Yjr6IungkB-1s!WUuiC-5(R2j4D9VEa zd#xF|8p6O*r(-F2uOrj$BGSoOMUC|4F%fjwA6}uDm6AJWrQBqFq_q zl^$8_&(N-Ax?`onl{}HB9gpa$EM2u+?afuUFVnC6e$NwdJ#7tNH7$IUYuuk{=*%z& zmg(1@(9BOyd~)J5dYN`VhPLk$-`t^PdgqGC`p8tBHC3k@9+>L#RSlWO&V>VynmV&h zotdfwDeDtw|k8^cq!t|1O_fW3=aHj3845LKG&3hNmXPOS(8weUrJtEOgv`eYxh~z5Z;?TMwPR&-8@mw|X+^g%MfG=8SXF+*nF@Xx_1Eg#}-f zfoGgyS{~A^zqJyo!U8Wv5}|!#={UO6@b^0nM|WFfv)@l{fZy+-e4c9AFjUz)ok0v8MOJ@}7+h#-sjw@^WNO;OKiD@CtuLzL}1 zWdA2r^RK93#Zj5GlcsQF=egoN%N`^!F{&p z%Nml_ywgKkyOP#5;~SLg`9-RXs(jw4R87?G)sqyWZK?PJeeJij`Hu%z^@!f4Z1Fz; D4={gg literal 0 HcmV?d00001 diff --git a/prepare_data.py b/prepare_data.py index 8bd93a9..f088939 100644 --- a/prepare_data.py +++ b/prepare_data.py @@ -21,11 +21,11 @@ from datasets import load_dataset VAL_FRACTION = 0.05 SEED = 42 -# Hermes-style tags (used in the source datasets) -TC_OPEN = chr(60) + "tool" + chr(62) # -TC_CLOSE = chr(60) + "/tool" + chr(62) # -TR_OPEN = chr(60) + "tool_response" + chr(62) # -TR_CLOSE = chr(60) + "/tool_response" + chr(62) # +# Tags used in the source datasets +TC_OPEN = chr(60) + "tool_call" + chr(62) +TC_CLOSE = chr(60) + "/tool_call" + chr(62) +TR_OPEN = chr(60) + "tool_response" + chr(62) +TR_CLOSE = chr(60) + "/tool_response" + chr(62) # SmolLM3 native tokens SMOL_TC_START = "<|tool_call_start|>"