From 5c04883c47f26d6468391492a094029ce21ab480 Mon Sep 17 00:00:00 2001 From: annotate Date: Mon, 9 Feb 2026 22:48:21 -0800 Subject: [PATCH] (no commit message) --- README.md | 2 -- config.json | 52 ++++++++++++++++++++++++++++++++++++++++++++++ probe.json | 1 + probe.safetensors | Bin 0 -> 20636 bytes program.json | 48 ++++++++++++++++++++++++++++++++++++++++++ 5 files changed, 101 insertions(+), 2 deletions(-) delete mode 100644 README.md create mode 100644 config.json create mode 100644 probe.json create mode 100644 probe.safetensors create mode 100644 program.json diff --git a/README.md b/README.md deleted file mode 100644 index 4fb9958..0000000 --- a/README.md +++ /dev/null @@ -1,2 +0,0 @@ -# refusal - diff --git a/config.json b/config.json new file mode 100644 index 0000000..0e72b46 --- /dev/null +++ b/config.json @@ -0,0 +1,52 @@ +{ + "model": null, + "signature": { + "description": "Evaluate and compare the quality of two responses (Response A and Response B) given a specific question.\nDetermine which response better addresses the question by focusing on factual correctness, completeness,\nand adherence to any specific requirements mentioned in the question prompt.\n\nBefore yielding your decision, think step by step and explain your reasoning in the reasoning field.\nBe sure to verbally express your uncertainty in your thought process.\n\nDetailed Instructions:\n\n1. **Understand the Question Context:**\n - Ensure you comprehend the full context and requirements specified by the question or problem statement.\n - Note any domain-specific terminologies or conditions.\n\n2. **Evaluate Each Response:**\n - Check for factual accuracy in the content, calculations, or recommendations provided.\n - Assess the response for completeness\u2014whether it completely addresses all aspects of the question.\n - Verify adherence to the specified question requirements.\n - Consider clarity and structure of the explanation or solution provided.\n\n3. **Decision Making:**\n - Determine which response (A or B) best meets the above criteria.\n - Select the response that is not only correct but also most aligns with the question's specific requirements.\n\n4. **Output Your Conclusion:**\n - Document your reasoning process in the reasoning field.\n - Output \"A>B\" if Response A is better, or \"B>A\" if Response B is better.", + "properties": { + "question": { + "__dspy_field_type": "input", + "desc": "The original question or prompt", + "prefix": "Question:", + "title": "Question", + "type": "string" + }, + "response_A": { + "__dspy_field_type": "input", + "desc": "First response to evaluate", + "prefix": "Response A:", + "title": "Response A", + "type": "string" + }, + "response_B": { + "__dspy_field_type": "input", + "desc": "Second response to evaluate", + "prefix": "Response B:", + "title": "Response B", + "type": "string" + }, + "reasoning": { + "__dspy_field_type": "output", + "desc": "Your step by step reasoning for why you chose the better response. With verbally expressed uncertainty.", + "prefix": "Reasoning:", + "title": "Reasoning", + "type": "string" + }, + "label": { + "__dspy_field_type": "output", + "desc": "Which response is better: 'A>B' or 'B>A'", + "prefix": "Label:", + "title": "Label", + "type": "string" + } + }, + "required": [ + "question", + "response_A", + "response_B", + "reasoning", + "label" + ], + "title": "PreferenceSig", + "type": "object" + } +} \ No newline at end of file diff --git a/probe.json b/probe.json new file mode 100644 index 0000000..1a3019b --- /dev/null +++ b/probe.json @@ -0,0 +1 @@ +{"probe_version":"v1","embedding_dim":5120,"dropout":0.0,"layer_index":16,"num_layers":65,"probe_type":"linear"} \ No newline at end of file diff --git a/probe.safetensors b/probe.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fa1d6498c31367309c212ec496239908c35fe9d9 GIT binary patch literal 20636 zcmaHSc{EmU^skgMMj1kqF>^xGd-g_=C?P47CXq@-N`q1vLns-NAv7t{ta#7fO{5GJ zjhg3C^W3*o*YDnS|GI14^WVGHd7rh;InUnDXWCgZ|L0m`v}i%Z+~B2y=PU?bW+bdJ z3XP6gGS^5j8tY(hWNox;e(?YN3bLDFZ4??D9Xu;CENt1_=&n11hFA}svDW(k{(a@# z1@q=d|9=*+9%g4hHRSAJx#`&YIPK?ZSrb z=_Fs%pMDiNW3sOfO!OXwF8R4oaj2i*JLW44(QxLwZ|wQjEyRY3T8TJ3kw1@Dz{@Lt zK--`oYCwP1Jz2`J`pz5_e2KwA3v~{zlDyTr1@E^jVbTJ1v1;WOykBj`eiIa6*q=ds zX@xOPNLS<+l{?_X(1mbc9E-)04!R+;il;6-2JV~EaqqRQU}GrY0FSAxnh+0hUWIHP z_K}Jl{?J1sBN(ogf{~sl>7txA&sLDZNGE@qc02^%4U%EYQ9;tvo)dU#L_a<;bt}~G zTp{e#=`Q;8NJ8s}@>p=jkkwOU*aZABW#MirD66N}P6=F*X3C?-{SvR&1jEBM6M1Ts zrI3;Ip0ZyFe4zCk@fLYrG0BZ9#$JbOE)kFuyLrTu{SG|sqBYwaREU2QZb)h-7x6R= zW9sltg>zf9;r-_!yzQwTVXY+xjT=Ni2Jfde(>y zA29va2j{Pg!#<@8d7!77pfY5G@Zm)p?JAFBp?`P$)WeQVLiWJ5IrBtC|2TNJTBWw3 zVg)wt)fCn|a)YA}s`%NV7s9N8`zg#|59F<%h>vHzhQ9N)IImNeKh&)ebzK!vv!s|B z+(Y2VC* zjxNNboz6Jw*Qt@IcJdr_Du)f5J-P3tDq8-k5rzgjVZ?(H;j`8t_O4Us4$BEp{VE)L zIQxj>0z#=yFcxS2ZJ=2XFVWlR=)O! zj`>Fk63r^Yb>mp#un)pT7f?tu!>oCO@YaiMLaY30notuby&u*gzMMIj9h0AcPj)aj zwa>;idCBm*Qx=DW?O}zii{g>_Hz;&(k+6KgKJ+IIwwa_weqYoX`pU4(1sjZ!&*mRj z(qX9m4fF|Jj4eH{QQPzZ9EP7kZTlK5`hJ3aVn5O94TYrDze&u{eM%1pr*dO^ zpxPNwa`ZaMv{>M$!$-+B%K}=e2Z@1+iPZge5FWdb2zed3Jmji7@2WQxdnCm1)MJBq z+{$*kF=7S2ktRrcIhIl1)<|yX?1QO&68LP8onX9r9LAOR<6XM5G2!4Ax+kZCXY+56 zreQwyiq_^`T6am=+YMhH+Cw_qRC!i)5`~N#3!lu@QR_lJc9+S4=zIEHS`!7D77ei9 z@GYtLxGHXo@WN-0PSF%|O&%8-#2RvWwA}D2+*3adMYC<09ma6a&CYztGKe;-g`mRK zK{y~Yfwq0jt$oz)#Z!*RNCMBQ!_41-Sn@RnM>$XDx3#MHJgPVA9`1m1>W*lzD_wAu z>48JCjd}RfLE!Hf?Np}5i$XB;&{gRn*7#Y>N%Y=S){f1k}E2djj}yphoD zbsPtcu!N0zet0Ko9d0+sn!E_mmF$=+_f9>S_f3GB!VYlrZj;3S7sC_t;zgs@94y&3 z8Lh0A;A!)dxO|Zl=Cv<^;}_Mqw)vvCt7ZX*D?bOV6FVVAIsz9Cz5vQ2RXDygogdq6 zfdz_H99ZN|QQLmOIpgOv%w2*8B@e}&2I~+X^}@!6{({-hRE#>H4}QK|;K+x|An}aA z{Es2@aH|3@*l$W#Mk;Z3Vk%6uPDMShnfQLfBB-dF&OcV36~pW(B8lwC4TW7 zc=0FXZCnV~2b$C_jw~m7Tol>gXM@UPkfJ2r_Banld=JWh-23^&opIh$cpaRIgKzZ&`U zbule$=*^u4V^FuKjW(T?Ldwj(c(0}z)V5in`VBcT;bJg5>$&jE;S)KqID)0&4ty~o zhu!mI9@n`1va0XuxQL#5P}f0?8~_DBP=t{ez$iUaw@_g64!k^#SLn~eG6 zHL>{ZPcd|;7K-~z#r^P|+IB64-a;rgY;xuc54Tf?)*LRdRKOu4Cg9Ak=H#(i4R2>1 zq?G9aygSi_?{!}+PMh8vQ>voS*Chj8{%Y`TXMJ#$+eI%M_XxqJ9keYr0=D%&2evEJ zz+T}BN!4GB95&<|{dDgM2W~ggx{&X5J}sQnu2fN$SvOq$EgQ{~*Rbk^J?H@w;r4Go z4Dwur%0I1e@{|Ue9b|xqR19gsIAdO6Xv~Kco5lABi?LPWOH=o42D!>h61fAuy!Kz1 z;M@!8UHB|CdZUT?xm8SK`(bW=9F`VZ3Ojdrb07b2D7(0peqYu=xmQ})B%1{dqxA7! z)e=&_uo_^PVw^yzAj8Y*ic1LnTT4tY{1POfy8bGC=KP<5+**0N(fM zH6+xoLYbL+;lrJ`LdP6qNNa6{DEULww*MV%(ey?|?#tt9HqcdnXH*(m23u##LRq~l zJ$v;=91Kt3owkzL@^LVG%z6Y)k=E><2l%QYjoy47z=eu`X~T3qo};D7H+e36jnl@0 zAM<$o*F+u~QiPov@1#F^q(k4x+oYM(bv`$4C7shJsI1Vt|{^(=e^yz$H8o%wILjHBv{_heOFh}~_NG)9%vQO9+t zloX3q^E_~@xKdnXW5indLGW#jF7`Rr3nw+Kf*r9N>1Ho=Ql4=W0&gFO8{K=MOWOwC zqP!B{nYp3z02KZv`{JwBDtM#P8`VB}q3O)te6_DTCsog*UG>`qv~45H3&*%a@r?M< zLmPeSM^NUenLNa$o;que(zOX!NY6hD@+RMcZgRf(?#>u~`FA2-YrX?VCRnr9=Uh6_ z|07hsKTKmAPmx0U1Zdvmf&I@vg&Urg_*OEFC;xNg2T$T)e(C`78Q@DQe$VLErz&vN z_(|gO3ZZxHB22KKLTl!o+4xj5BEo+~zYz{2jg zXw*9wG@IB7bszLcW}di0ha(nKR%s5cyk#W*PCm)r>#jg;k_;dDBF6!jO}OO9XSkSO zD1h!x4o`Uj`{QnkFYN~5sq`oo*J^U0>Pa%5J`v?s<@iSX={3I7T;C&%s; zwESQboR%IN>EAaAXZ^SVeUJR1m-DBA(kmx)(~hQo9$8$iHySUWUPP%6Ur>S0WjK60 z1alHh&_7ZS^&2edMNoHK^QHo;?4 z4n1>KWBtmwe=J6p58$2SG5W39olK!Rz()BPk;|Y)VbkZHO)0% zO70al5IH14y44bBbz9o#uDL^wy) z-%55-uHAf|ecFc$YscYvy;^>}Q4Kq_(m8LQ2#b15r$N1P@OM!cFL&1@7mQ@pC)=ra zq#f!VzXxM>92Qcn_QHXoCj^=97F^^TMaLhG#OGOZ7_)H+f9>lH(WmMK*(W~mGA&bx z{QZlxKQ+Q2{aRAZ9>mg?7TVKlhR;fqhQCQkp>?~T3S(LlC3>kd*g5Y!(NUUM)y zt1ZMG(hn4(-3rCRYYOjo4r0o0(X!^HXtBo~S8I1dRQX@wf$bFB*qTX(RhvPlsRy}) zeiOF7?9ZECyV2MlvizgdkghJ5;n18?_LNcL*Q4F>$K)$$T>b%O9Q;FkDUxlRTtIoi zaJ(q*$Co}`gf&r)c;EOWte5(7iTVeq$ZUkZ3iqM;pCM~oRe-9o1J4${(X?|qM{91v zk@wA{<@zUJz`GsvVaPJU)8G$jPaDVLgF|HY(GYWsyW_K7dttr73bq_Docbaxjo@9v4JDi3M!>nZ$crw?@7D)%az*h z-2am-)|qb=Ywz7RuGXZiyfF{i9mjnY5s{7N}M|6RzkP(1W*^VcXUMF#2PG zd+gewqeM;2eQAPz>(V7_+v#``FQbX4F z%E{t}GTUv62jlKV!ijBpXzcd{F1a3o2WGFhzThtW=upGnDkntKVe;JcP9KvD`VizF zhLdg*^l0lut%tT_%6#hB=q1duC?o0pX=vjW)YV`5;LnMrk_Ao6`M-&e z1jop&xbdVfuNZNh;=N;VfW9A|?J5r{*eDIHo6AynC!jrAjAYz6(F5Ia_+s=G|mrf>V zI&VYm93>l`kntZh#|*_r;U&5F1;N=b!%*Q-x}>5*fo)Ft!s+Buf}_(q9Fg2Cx%W+$ zJyw>2?5UnnSu-r`H9UGo*5g()>#GUFl?8YXmSvX-AB?r z#bx}{LWvDZlEB-@7ad2Q7hZbyM2Cirpmrq`qaF?Ci;*kPckOxFl+p)>SWX0uLSQ$) zi_+;X*`&GeH653)q3HXc#kV)Uf=skIEB79OXO+&thvy@No|PLY({&KP{Z-5+*)yoq zei+A3JSJq#@Dw+n*&<}UcBI^yKA=1MyEtU#RQ_f$O_+0CUvxNQ2dnK>K z1Uq#wO|FAw6I2DQe*t1+lnC=;W{`JRJw2{&6#^}u(jNC0&@V8IFU9AI3$}FU<)Xt}a>Xu1xcUy&| zal8+Q)=pqW9KbCVI|a|+{%E@3F@=18Em-E*(9p0E?3nA1J>TDl)onM#Ni#1BPtR%c z1vPb+1`dZz^IGb+DV;0*WYF0;7sNde$k4!v-@JQE^k*^l%gunM>Mox8t^+TJ3FO^Y z3G<3KK*jy*!ulo17oNL8Se6Hj?%N0UTlb~9W$E0FTf{Y+GvNH@PZU`&jE_{#A)hnh z)N|EU(ej8q20EMu>Eea>VsHt~SscI%pG4EgPXTOJpv<=bY4AQfkZi{mi*sH~=c%cOAz;Z1v1o}StoxLR%Z6P8 zt(_+*cB>Q5@o%AB*KpZN=B^c*To@DS;Q%um=*auhQ0H<>!=A&UuO)xg7o;>oAb(yqqizK-FInX~v$ zjxz6i6NqIWw{W)X1hBrE#m4`7pl0iKQT|~TN-BqAuLC6@J*EU>ZS*ncVj^sQ^aND) zmT+fnChL`iVSuJFH`P9*pb@VG)8Hr!KlW1i^xT=nh;vk_FbUgh2k?MwFC4I2g=_NC z@MgDlT=S+9uH2c5lQ)~0XRweboByH zK@1p(Bh=Ex%Slm+u3G)JynE|Vo?WiN%gvVrtcB_2+Wm=AyF zWMTAEJ@{3VLoIvqVeFF>GV1(9d*_@5-vdKgG5Z3Iu~Nl)CFPPwbi+zGt##M^htjwB6o>9mB z6}aq?7y3T}+w;cg|=a@s%_p$-)s=8*RF%i_WEGz?p}3eW8Fuy(?^6Q!WNbo{Q&q6?dw-tSX9So2p2;bza>P_yUA}z<==tQ0IJxWG zj2<6{eD4vsj7rCwtvbA4^8;<@=80Ld8<4^^;M-j zbtP+!t`Lr&C*hI3rx;gx1|~^$@b-({d~9E!D9vdmnW<}8XRtc|*V7kIgdL#7Xbp~@ ze}|OT=hDZ9d04)G6&-t5LeD>*<(?bH;#;*OuFB4)>cwlwadrjSj!y#d;9hJT(B*+$ zeg%&r|B$-VTu4uwikj{JNklRiCBzKb6R-;t%dvD0v)wF34iU}%j^#uo;*+}}f9x+Bb$+n`D8 zp&PhiFYYZpm_rmL_Hr}y1DBa zw8YE9o2DT!`uaYcS}MyDFDLr-bO1^*o4V9Z_*tSw?Zc9>%-;>AeM@-PqjRFY?L3aL zZKf~Ff5PCD4(KdM!7&e%xPR3<@LIW^r=C#ZjJkagmbV#&p0YUjOB5@364fu8!uwaY ziSD!3a<}I)^vl=|uXfemjXt}$(OD{%)jtNa-`^mqFbz$kZc=D~(NvxV-33xtssZ=vH?C<|vt@`I`QIO@zRvO8Q!Ek!y) z)fFAKd$~-Esn3O1=A&@gwg!?na=;UhcEN*hmY}IBkB-iW3$>NuamhHCDsznXO&-9% zN*7W_hblTqv?M-j$AFL3S`7H%EI#x!;q=UGGA(*dWeKHlMY+o#2?*uN;Rbm0$XVfx z<3?zlR0-1`7_*znc+4>K1o5Z=r%%)22SXIF*={ezCUyg{O^)wd7(;%?e(A!OFT~FN zo?QERCeOYNBs30;2BGngA`HPCD4}WfP@sb;U!m)(la*$aGv3wC;4L z_MIkttG6fU=}o7JUJ9JpZ97+1da|2V7+*cy52PA@#G78-)lQVt@`~Qbc=Fnx^QhPMbCR^fp6F*g1m`aQN}t9X^RNm7{^S?IcNT7v zc(wdTcfYq#wWfd`i&7+ELGNf!;A#%tdy7JzY=CFm)2Q~+OQBz#1CE_r0Md{zLbu;e z9Q-T@y&XqkNAeP`KJLVYkC*Z8zPTVDeh;qw9mDQJ*K(n!uH@>3M`HD$5>Q=GE2eAN z;J3IcGEg?cZA)T#G8o7JdN&2TziJbcCvs-sLwD3~GHp4im>vX0eb9?fPZYO~>62Q^k z09)-GATXj-ycJiDb&K@*GN_=}X+`PV_p{I;EDt{T?-NTd+=4>?eqa&&6%LDnZ1hi4|w6#peXL;IRb~fUV{a1Dxg$$6u3NiPtCf1xTER=t-iDf z2H(j+z5G)C?%53Q7Pe53jvgNEdY9q?TU4Kxfk_S~SifxsdVkpmJG@dku22KF=fuOc zCz0Z&zHwZ$Kangve#5Z>Jv=!3CE$4*jJ|$CICR^F*L!^;r|r8*FYN@Vjrj%pidG4q zbuYkU)e|&4HJj@UL9FW7E7rX*#<(zfXw#ZRZ=QAGs`wag+x7}3CKZ6H)?Wya4FkDa zBih^LCA*%HJE^op3A=^Yvhfu+?tRRKYO=S0v+@VBoSY@J-#W&7&4IP<>axk3^e#Mc z0Rn8ULf(fOXxp&^?$s>9lht?WBKeCnlbzyfIpxn5cxxfW z5z05HbN3kfce$2S&b_9U19wr%qm6>$X~ZQfmGDUWPJX)fE!iy6;GdCxqSemfd?q;r zYd#@o9F4&#^K|gkmrRa(Wx#n(hPalx)4iuRz$N}Y&3-i#J8zZK-wE5vaQGl<+>lNq zgHyzkj$52RZz4CfzM-p2cd%i^4j|DVTZU$cqYj)Dn)l}jhqsR5fgVoWe}xP!TbzyW z56!2x<1(Ha`>uLu!Hri2VoQSzH8&kb`}YI5q^A)sc{30T2F_r}HDdAG zDZ1ZX5jr4&Rc@W8J!j_9-fC|?sryXSrdnZY;dnk|`Wh^ItI*i6BI(;WW6Zpqgi6Ml zu+7z}!ec7!%o{5(PZ|Ecq-MZUZzL7O~Q4WrG~ zsr)Weq?hjw2}vu$(8OXnrj6VWbBE1hiI4Ho8Krm3wNt;(Wd59n48oaU0Z{&@m;%+xu=vv6c@7QFn`pkXo2;64SCnb zc6yL>hU`4Mv%G8z-OXtd$N%So?>p_#y2ytMvdf`kzB`3|PXux9Aqd=6Ae7oyQ%mR~ z7FD|Zx6~0}qb#7DLL1J~@r4;Lr{Dp})-L_kAGHe|ab?YaV#xHn;>{*X_-n7Ox5^v*;J0onnpP$L)pOLCQ+NV@Gtx$T$hnW?L<9sf@3Cxg$T(UwA$GscJP8v_CzP}w?y+k_p_&aS-I7Bra zkHlXq%b=iA5x4ukp>nef8lI+wtH-RRRk|yL)lx^SITZ@0jun!|<7s%?)rR|;FT^Jg zu1Mq42g6d$LV`iE{IJ~+B0d6M;4`FeAVa;kMhY*~9bx*CK`1w*n1&{Y&<&eVKDj-Y zv#)xi%&OfS7@Y|Fm#iA8xn>cxw)Mc*(loGE?IiDQ7vR%`QJ8mAgVW4wg?@b;I49N; zUBBAl;MKc@qop~5+VxfRqpOw{{d0wFRz0C~m@HT7?55yvB9!lU79P0_M)QKDZS`v~cN2*0k-)k;O~+ zvxXUueCUH$e)Yil_Csmjx++#qQX}int>Ql=fz69vi_ezWKvLplZn&XN{l{qG!aIG@ z_Cq0`JM2N+u^(3HQ`lZ1S_<8v9xJ+ewE1uKWkhJJj%3_+7eSah>); z9F8|i!p&M`Trzz=>YO%V>wm9lp3Hn4p|_jV48t+f;fB<&P@8LI?eX4c54`ew9k>fPv{-f}7-(w+ZNtop0f(Cf!*#lkV zUqjsWc8WH60A?!zr*%^huc<4rQR-e08WPFvqa|kQJP-yZc8E80J>W)B5-w_4PE#Ex zq3m9F&?t5Vx$NLt`@3sdd$%oL=$Ao?M;C+r@cg^v}fxTR0e3x?HMw8{2nUoo{ zoX!SzgApdSEHmO7jY&8oJU2QB`{wM%=LY9sj#?j#(3EvlFdT`qo~Pp=zYFxPD1sL{ zJth0JNO)ThpFJfmrIS%iH@FQ+qF^ zE^gL}WwU0(e5i&-@5S8Ta=75PaWwU--SA4yVp$ovt1xEd541#MxXtb`s9KD#y(eV{yY}3F{Te^T2{H;*`Ym;)EJc zv<*MV^`=L}kjE0XDN%w?^8GL^G#PVM&I?v6Lb)nK9eB6+56*)cX&l;|_$)e% zUWMvbqNu5O80?Ei(bPRlQMSJyUT(AD!sD7q3FX3YKR0&Cy~56y)P)mfA-rvm92b1K zMoH0C;FlZ87JV(K=d^D0c@qnxYIRWBa}S)db>wkg0&i%@6ql$e!@&94_~nQdU)KewUFxGgBzG@lzA)F>$VAcs87qQ~`$^!#fs9+|xbvMP13W?Ku7g~4oi zwg+}UagZKWTw}AJ${48Z&Ifm|HxxeHz^Fyw*UnXQu zWrEZ_c!peg>#5shxTj2_I%73mQ;Xr;5+%H^u#aZNZ(?=hL}5g!32bS4PCMR?!rfOb zm=%>+&%*%2)F)!+7j;~F>YRA>2f~MdQDW-yXF{({HPY{DNg($qRw&vQ$90#Yd4=Ul zE;W5lOI=rC`|dXJzt~8AV;RUMv#ljP=WEg81PRQ@{zGRXmecud_K-i!jA0>&Ep3S9F+FWDx#|Z+l{}#Fk@`65PH%V_?L@(Uuam>5 zT{LFQQ3y+#&8uvTaN^7uw3*W?RCoJT`+MICOnfy6yDtlD@z(j}WXIFpq-FHdA9|4@}yu!%Dm4 z#4X?2VfFJDP?@xrv*KJ>(@#n~$clezt`qdl4^V!8ZI(~Xf{Yivpln=MUPNmHI?6P| z%0>4f(Lje=8ci`N(E&_GU!h-xN_^$7Hvj0I%Fk{EW6A4A$p1Eph85Mr;Ay2@IqY53 zy0aG!jWpxEJ`y-kW{R%QB5+s8Q}{K%oC6lQU_pNH$YQRc8so)S6jUYPcSqfY z$Eimb=lK%-ohsA2F@C!z2As6PfiIgu_VXybgL|n{ITbs$cv5UwCYyb@0x3I;_^`%j zy69HPQnkGl&x*b`uNT1g~T&_I9>ZYn%gy_`0T7}pi%FON6-+Xrd$=` z(~#v)hGWEt(L!^y1z&smosz;nz^^XOdG_lkj1BlBKJ24}?H&h(y4Yf2fvYciFH7Sl z+oLEwREgt8*po{5EBMyoPsvC9!0t^DDV`7H^)DVvBrA5o{J$e{-S}$WZF@w_f6*KM z$yxBAk3IN@{6zMjkji##eXz}89xA?DEv$--g|J2E05^9|N_@qoIsdc5O)8X1Mpg#NzMQ5Py#sJX8If*E&*R?7c;tYYeOxL(5qk8 znDIHE42EjZeM570jNA|U%Ld`yLB}EH%RD?Xbu{iNeM@V zJ^vIKxgVfSYrF7fAEx*Vn)vsVDfr7j+p6=_x5K=5>IWw@hgY& z?YdD|e^3n%<|mPKek1B9t;dcq1Kd7(3$Ho5Qv4*%r&Ya;;p~;|?EPN|Ot=yRbVrAk zx9#RR2bw_TP@d2+Z6L0z9WG{>R>059Rj}DA0}5wsrfXAXuy4;3@H=Y)>y6LBz7jiL zQ>THeJ?${xqJsW>@x)D^wZZu70$zI&ab^B%IC|Rog z&N|?gbu;;Mz8ai0_Tt%UzWhKTl@Ht;g)95qg~ph!-0z4iei-tXzH51)P-Tg8KI>!g z=mOS1X~ljUjn}PeS7dwO^RE7Pesyo`D6_+vD~i$hYgg7QEtR4yby;az z1^LvM(f18wsY6bV2f1!UGutdM+dGFNr>4`w;0XSp*IU%oK0~LQ;AK$ z5UpT-U4EOs_ZSWPKicw}@3wqcxhD@*jO{v8rgC^~1;#Y&B87jaY3buBRO!}}l!tVa zKBQ(i9BR(-n!)_#Q`b8lIUA}9|Es-PY>Efv%D7`qC`oQvVT0Lja!4D`G0%!&@f&}L zsPekZ==rFK9J9LeYF!-oNJ$F#4%+}H zrdIKG-V5L-4S;`T?2g_FTDyi+%dPiG{<%&pfz|8D{tXHQ4f zq|dO&ZwkePltRth{iG7*0CPti0JW}XoB3%lU0IsJFLc5{9DIUz(_H*}fM9IxJlJ_d z!gnY9fpg^-C3kjqhlmm)%PI|48SoK~yy}C}XYrgeRh{Kze&Nge1{~~cis=cRu+wNL zh(Z=CF5l#lBQKq<=Gf#vi}jU^(Xd#K6aMr@L0K32-yVe@ z7OJx0`x%({vXjR5s}bXu*FwOQYtl`&^ZB+-B1{>CE>!EsVq8|@WI?xp)8_^e=JslcZKIfSC?e$`z9QA-c}QqKgkCd zMPrOuF$>=hH>a3EGk9&lD$;N(Ca)_Wq3u8?46>|;3F!j&fT_ac>n<3#D+73B3J=lN z!>#^G9Cb5Za^UHG7%$tCYa)uUqq{XG3uvGgIG$~A(4EBkcqo5MKhwh2POLUuXo!;e+RaPPWeVT8>d zy0hDx+=pL*x|#1N_;(yD8egHuGcVEgu1xat3$MgDwJxq^HjQP?9JqbfT~e8>g=ZCB zL!WR1ToZQ)#_iMMH@{=3>Esb~&1m4X)wdzOm8iK*9=DE~j`7D%)2u~Hhp{bQYDL=<0byXp1g z#5`>pcKf`zt)Xi_T=B#e9lvS7-FONe)lbq-#v2u$`mt)N9G$t4$V>Y7#m{^*R~0ldn(}R4lgiY+l{O3-Fe`$(Jao?#YLAiu$z@K zg?}AHd7+=F>U2B!>=r2WU{aTk=ZQ;eH^7Hw&Dhj@M|$5m3ZqpU>HI5Cex`k1j2^6n zZ<`b8ymdbG(9jpZ)OX?R!*Y0_WS4NOxe#9IYVeoMQ}DNJJ}*_d1`+p0^Q412k$3MU z<$!7MV#7q-I?;#C2d4;c#_937D;LnSXbJb6e4O%fi(tv3GobTjH0L?4=8;Y|Fztv8 zHz+4b_a7-1`LdbBYD#~u7}1|zX*w0XicN1S5gOIZfJuutBREfVHNwcSv2nJ532oyd7|DMDg5AMCw<5Ld?c;0HGsvQwCZqZU?EmGcVx zbbbq#8}{N|`({w-q`o{@)j^oRHoUUma=PSDM%A?|sXb>L&fAkLu9#L1dlzlQK-XYl zbaIgxdtF;>TAw1#`>qOV4trprRFT~_XQ6q>FL=55s(8717%r=}0tbZ*P>D-pE6Wo6 zrBa4lB(~h^a976GXAW)7`zp2%RKUZdzJO~l6^tCOgWFf0hY{!BQRs9uh0tRaavt7?B)O(f!UKtu#-{8ox%ZDKLdQOW}PxDUgzIZFr zgy*k&N$0`?IlfYaOoiimZN5&}=rQ6#s#`LImU(Qh z=7w^9%eXbf67L<-;a}(aP{M}2;6Gl9n(rq;*Nh0aPN~7N^# zmMlx_Cyi-HgBDEA78zyi^{duKoappFuEZLjid@`EtJXFY)<1Ew&Ar z&xJEmU|}CC79vZyZlVeI+d7hOB`Wi#kJl;5QIWqZoPxNA;kc!b6+Ztxgz(EkDm7k0 zRd>Wl)31zY%How?-D47Rthh|-qQ)=xtKojI7z~fqsoAX zu-<=*;6+lgrffLq#v&J6jUyUw!mi6ZMAK)=+*AI9I4)^1S}B?1{ek|de)BB+4NIsU zf4UAF!;QK;jD4bMcq#d1tmpfZ^Adv{rvXcLz)fEZBx6gIeR3VGr)c5_U2C+=m%~SH z&&j303k+vn7PAHke9ZO<)ug8I_mZTp83#*TARUGvxX{fz9$5dcQ1CNKft!x~U}?ou zf|@_VQr#-tZqkkVojpWVL*I)>zbEqO{tk35Yy$QQ83335YM|kS@qB%_40R4YBH6QO z2Cs2eK(U0)8#R%8drxxxpC6 z3@8=0Pq{{}7ynS2+)n&__Yu@5KNIh?I^x!l>AdydW!U{Y63(S`L;I{hWIRs~GaHTB z@bMnF-!&Kh*mVNCef|mcJ%;nP&}wknFb5C!egV>k&#>sib|^m*!2^#NsH(xJ)3z89k^-`g^tSjI9S`U6od*YZ|y3pLZj2DR-;C|?THE`yCJ#JkXrZlNEP)S9E1{6j0 zebz#QB&Eqrq{vL2WbRPXEEOdgE161zDSFl_5)!BMMwyl2P!5?wO1#fMuz%Q}z4vGD zdtcXGA*#Gi#Jk1HAiw23<@~t|Ib9hr|BMwI>-VMWO{3wPLOqqZ6q9$N9p4kJc-q&E zVu$HsR9*g+PkM)Nuu~^>ic@Kz>p_bB+kppueFXm$3>6<=8iH#Ad}Xt-Q#4I}LDNlY z0eZz^&v|o$_UGVpC1iGG_vsznD(@xvM4s$9 zBn7O}^++S?U%2)qf~|Llg4x9O(#?HL@YZxQtaKFl(P;)-i6Ft_gsa+V}lwS-7s;(Q!$r<&u%ty{><@d11yS6Dkm6f8eK zB*H>Ek?KaCzTMPox&xY2N}g9?PqEX>fvqO+jJh{w1)Y*Y z*%dJQ9mDd9EPkoGlXJ4Opfpd)s?z)O{zc9_wnH0j>*Jt3XgUAZI6|{#$l(&Z8mj6& z<+5L*KP}IlM>}8Wp>xJ{kTbKQ$3=0v&M6qR_dnWHR!F}3gRsl{9_om@xJT?! z{8%J;`t2I%cU*-%EIcs7b|n;go`v3LiYP+vER{cu6XR}W;M$01Lhz~!;`4voaO*TJ zvB$AG>8~Y|zRga>*nUgtu%;ZA2e0OH=W~UEb$@Z9qaxj`G{gHFl<~lm*${d>lE>Vh z%$Z}i(2_oucy6{cr65#W}^5vL{N@(dK+#sLRomoW$#J=ez|^KbOO6G;fpZ_jY)+td*+O z-wN*xmqBxW6E)0K!^-(5#gM{CvQPa2imS`0@aI5S`Jn<7-kqge$2-9@GKc@`)1!3K z7)4&yIt#0d{)V8$Xx6FI!}5@Hy4QFReTMG98?mWmlYJ5CS-Rceq}}wc<%Cd|yA(U4 zG{GnBG#g|qlh@`qVq#{-4EkmoEEK9Zo`oD^6Gs%p8R_lsP6nux|f}(t#%aO zn57Ok4Hxs0VR~3*VT%TLC$mac7^gK3<-FBe@Xo9q6t9fpJKg#?OQ%fe>tw~l4@ZHy zLI5WO+^2?i2ULygL$CTstnQv}tSOP$Bl=3~7fFu2NeZUvhT`%AQds&}7rTxI^5=%{ z0HbX(wI4p>$BVGV5U9R zjBPD#tw@GREl+7=QVTgtd#lzv9!*r{@>z*zyV2pv8g4^i`X_aiuYW5T^@_&1{dIZt z?WeNs33}YqLh4(%_mDy>X7a2J*LmUGY)YLw0Ztv71gUl5TnO3Cs`mz@XoDyl6%}W&V@PhVSN5SzAxE zPh84@s_ii0 z0ta!C<1ltla-x8#$U=FNB5#g`exaC+X{h(3KjKYeu9e1&+gDlI<=9tLXdi+Brj0zH zR$^JoVyJD73w+a&PR0T)OtO;TDj#AfP>A8k9S?T02UJ8Z)B=qDajeIRU|5>2U%ThL}= zB_+RpK;}6TFWEE*YtEUV>G3}J!J!Vc>JdB5O3BAr;WuHP!v@R+cKlznbjge z%b<;>UG+qhnGr0nVh#H<6#3h(c)0R@Fb9raO4YyL2rhQLS!eVic$JaIS+h&Uu@`@p zu1$!?-qBjHIi#M7=Z|5nsjuIF3UxK^;m3-zkmiSm%hCV%4i5DOD!f{jcP|ewc z77hMDHDT-Nw|kwKs5lTWyKBqzCL~f}%|!mS&_mz<@a!@J?| zvVrU*`E*;`r}2{^H^_8Zkua!<$mo&unH+G8D(ZJ(c>ZuqnBva?U*p-Q!2&KGa7Vod zqq(uA0y?jlU`5|#N?GT{a`R0wc$xvk#;m}GIrI6^`6e2uQb4XLD0P{D=a?5om3W^KTl`_=eKb{xFO zDiPYm3;d!+;Lzd%ZkEpn%UpBREO6p@|0{w}-A`;b_2iO7Y5k0d!iqsLxaLalrxI z8XRcv_!z2-OchU+MNv_#9hNEd<(PHWtZu-#I9i@-JC~u5WQL-VJo-L5K=%Dj#HU?e zJk&CUj@nKK{RcXH?Wh61S@1?Wk8NmATRd$|OT%%C+@RMwJjmKTIXmWTCpUTl3 zZ=}~OJWjL1;GM0s#HF9?Pp1J6*;7CzBh#_CvydfZt~5Ak0bhL91p2Zvm?U{#m-C#k zwqPn6`pqDZ7lA^xgTNi*7D4Ik5B4cT%SA2M2jYNuQ^Cw}E%x}w410dm!R?WU#98^{ z_&&q9ZVb{zXw2l9$5iIAfsL)Tuuq~Op7=GpnMt=N!Dzbpei z?+!YcYR(^iy{Ezvd&IZ~Rmgb_Sfje1x`GTzLCqZPMqLo=HCG8HMr)I|rc z7Ki{PD6~E;n|Wv``>9EJNy;j2+Uo;i`yN{JV+7aeDkFsw*?9F9Hbnc-(|w(yu2p|L z5p2k=4&CD9gi%8O#%&ySEtBVbp2QxhW3g&Z6&?E%Nh%HbJTYJ&sQq!m%k!QKA)Zyl zueQVCrIT?^y&E>Q*6`_#CXhNcgTiyeS*cOtF+jDxO!l0bw3}FuALcSR)v{jsGY3Pa45XrWsLA^+3s$9*NRzc49hefL(dPwj`leTS2iks>=a7YfFE58>>> z)um@!zmxV9D}FV@09TK`18G)jyt(xqZQ8pZWkZ^%de;g3c;_1(QIAEpEk^WLaT6|_ zuE*_R7vXTSjEB9uf)3_KFs-YKZVZ*-0#V{^%ct?KMyW?&Q8g%@9*OLj0yIDg58K*G z{W^tUHn3BC{%MTx?+krB(sWe3nVl~4&5oncFB5R3TQq<`c+z_t>f|1RCSyn5mk@z} z^4e+h#~jR(tAsVrOrb^52qR>R(aX8?)nD7FnKT!@V;U8l&l9ms-> zD}p#6-~it++Qs%eN=p4E8M58_8qz&uM5!(n@LoTLO>S4fg6-9GrOqB#-8~7mW8J{z z*?H6%=D^3_YcW*l;1i1_wEo#FHuJs&+r4j!_FB\" if Response A is better, or \"B>A\" if Response B is better.", + "fields": [ + { + "prefix": "Question:", + "description": "The original question or prompt" + }, + { + "prefix": "Response A:", + "description": "First response to evaluate" + }, + { + "prefix": "Response B:", + "description": "Second response to evaluate" + }, + { + "prefix": "Reasoning:", + "description": "Your step by step reasoning for why you chose the better response. With verbally expressed uncertainty." + }, + { + "prefix": "Label:", + "description": "Which response is better: 'A>B' or 'B>A'" + } + ] + }, + "lm": { + "model": "together_ai/Qwen/Qwen3-VL-32B-Instruct", + "model_type": "chat", + "cache": true, + "num_retries": 3, + "finetuning_model": null, + "launch_kwargs": {}, + "train_kwargs": {}, + "temperature": null, + "max_tokens": null + }, + "metadata": { + "dependency_versions": { + "python": "3.13", + "dspy": "3.1.3", + "cloudpickle": "3.1" + } + } +} \ No newline at end of file