From 1700d618e5d02c7b1ab42e5b1390f972873f59a8 Mon Sep 17 00:00:00 2001 From: Daniel Rammer Date: Fri, 15 May 2026 10:46:44 -0500 Subject: [PATCH] test(python): regenerate lindera ipadic fixtures for lindera 3.x lance v7.0.0-beta.9 bumps lindera 0.44 -> 3.0.7, which changed the tokenizer config schema (dictionary is now a string path, not a { path: ... } map) and the dictionary binary format (now requires metadata.json). The old fixtures broke test_fts_lindera_tokenizer on all platforms. Lift the regenerated config.yml and main.zip from the lance v7.0.0-beta.9 tag (lance-format/lance#6719) and update the lindera_ipadic fixture's config writer to the 3.x schema. Co-Authored-By: Claude Opus 4.7 (1M context) --- .../tests/models/lindera/ipadic/config.yml | 3 +-- .../tests/models/lindera/ipadic/main.zip | Bin 2450 -> 7250 bytes python/python/tests/test_fts.py | 3 +-- 3 files changed, 2 insertions(+), 4 deletions(-) diff --git a/python/python/tests/models/lindera/ipadic/config.yml b/python/python/tests/models/lindera/ipadic/config.yml index 6b3f0af40..922768bdb 100644 --- a/python/python/tests/models/lindera/ipadic/config.yml +++ b/python/python/tests/models/lindera/ipadic/config.yml @@ -1,4 +1,3 @@ segmenter: mode: "normal" - dictionary: - path: "./python/tests/models/lindera/ipadic/main" \ No newline at end of file + dictionary: "./python/tests/models/lindera/ipadic/main" diff --git a/python/python/tests/models/lindera/ipadic/main.zip b/python/python/tests/models/lindera/ipadic/main.zip index 4db1bab93907f925de36e4361792d3b540b1211e..ee6791dc408a7cd73df2e36b2ea7c12c7c5b5418 100644 GIT binary patch literal 7250 zcmeI1c|4SB8^?z+X%dFA6_e`NQkE=@{YXitvV^2Cl#G2JGqRJDUD;0=V{5T5Lx~yd zI8#bg#H5!&C`(ApFwDH8lMbEF>Fxj5GoO2&=b6tu-}`=k_kG>h=ejQAQ$UVwfYrn4 z-hHbt7hk_X08xOOos+w~xfvJ$l;~e^T5U))7l4gpo(%xt*va~%G3)Ww^VTnqAFT4Q z*~PkpvKr6YM&?9@U84x_@E<)Z1cM2~gq4qBATK&QS&h=!*=Y;md&fF;QXnf8MGwd3 z>*Wb}vj9%GHuWur+D~8Lv5ZXJQ-9U$YO>gCdM1<6pxrZNpK#}}R6r7;0KLz@OYM*6 zkAf_vvV5&k^IBw7?bzels)s!VBH^GscY*4ix&EpVh%959CdsdtgB_ePC35TkGRZkrhb+ z6BF~iONHl3Ob}g`DtVHkdJr_3SRZA=oP* z{H&oYE8sNj=VPC-FN zVU3RGxD&nmC+!v#0;05tP&Kyf=aJFxcM+2wGkD%) zr%D{x)#pT=SCLVVd*As{*E&2fNb7idl%GGH5eQX`&hT|M)z%DNCTMp|`}b4L1&*6+ z&jt%ONs2c*l!G!tMU;VDVro7uyga z1&bxOOCd1vnQXE_!(rE*`no-t_b<*&ZPzWN_9Uh*WfYHlC8UPW1QSul4n*Hsa26aPA1Fqh{zJED*OD5 z8LECkaSOw?OmygYHExXGtm8@Wlz8`qE!@zUV7M?$FR&4!Qz6|GrKKd9hS(LSluva< z^jK2{)UQXiZQyA=LTH3qo`}7>=ufu5n{|+~5=;o%3vtXH5*kHwmmVHHM9X~DuA!<2(HoM}xK6e383^Lo?H8c^D=e9HTcAd^5T zd&3)?*ig0>&j^@7_$gbqK)^sKSjZg`7v>|*)gRu`7#`HxcrAO*JlOjpVezO;J>Ix} z`E>L-Y{Ma^N8zf>+TfFzM>fy@!yGovdh;^v6%6#r$?02m<=xei1f3T^W<v8r9& zTVQ17%LVn1&U!Yr6IbVGiL-h=Bhw5%Vo8*&j*MaH_>yvcUI^R9)r}v$>m$VSNF>$@ z=U-dhZdZKm?CpH*z%mM*9fhI(&K zrKA-yF}Mi+v-`r1Z8=4)7aFKbHj2%aKBRoUUqGTd+aRsyq@FBh-$kjF!NuT3TGzxj z6<^61)L7~bxnrsai*_?4d$SYb+=zNR^Lx!oUQa}~ni5vp^T6@^0SeYU=x#*k7TzjF zY5QJWaTCWgalDD_<4Ww3XY(Rs^u=Y2M@C4tv2fVw4C5@FBpfAi-{V87jh~6)$TOBn zbcvn<>oFCBXE~LgYV&~LXX-cb%{k7tr09!6`q8mv`MI~uEpX#gR6)Ou0`ZmLSR5dX=d&pG?u^m}P&vk1?S3@o zE3X%mA0vf1XQmJ1R@lz`(k9@YqCveWx|fP6vf7)vUv2-+*xq<#v3bJL;_8VQWbuB4 z?|tca(x?>KhixcSy^@VmkVC&xnSY07M;TTs3LHKV&TJ^>IlNDv+vmWi-xZ>7c3eBj zJ7{Yc+K=SpUzwy%e zH0o&ax(*_#{YlhePwNv!-WA~>xy;=<33C)FPn%3$ooHq&a@}X${yt=Jw!d4ahzE;^6BVZui)}!G#)NFbGA&cp~0{P_1P{J)TG2 zicuT2yyTbFKgQE3^)&9cybaL<%^t%HGyodKIf$CEU6zA}UmvnV!=Pa&hNv^rn!6ej zNt6n-C<71@MH&Xfc#Me2Gxp1TS>gAF(3zn+f4-XWox~mnb`Wthu9??X;7PMq%V5UN zj+VJuc045HcO6pf%q2WWNLc#N6&OgKRDcEQ-4h8;OB}Mq__5%S->8@UWt*e0k zs;m5?rm~9qx2nn-3INCt(^*5UtFinXb7LK4Ju_#Gxv{G9bJ&e}=JnWK;MceQmUaF) z;>O(GU&PfkPkz{gEnkV>W%_=OyD_1)exxE>zjFWH3%{hdevZ2_qqUyvxyE%{m*4t1 x=*F#jJ#bF`#I>wjdVRUPjEeSbzA*6B8W8y005Zv`OMmq4MbM&{tGD*O-TR% literal 2450 zcmWIWW@h1H00G%e&!fN$D8b4g!;qVpnWrBb!pXpV@tTSKn@tg>`Kl^EQ(J_ zP18%t%)@6L&`XTej4n3&}kI!_O){hOb>eP!tDYo)hWPOIDK|8D2= znEOXO`&-(te$}$9-C23}uU6RezjxiM4>>LUVDqMTMQ6eufwpAdr&WOg!M(rh45enS z;kV^jl-b+4>-wj=8o{h*1E01WTyZ}r^y-bS?5vnTuemSuq_qQbE8}!$J@DK1N8!U= z{!O)00y(d*=l;4-{(6D?dWPVNw(S-DmVXY})V2RM>%N_HHaj|nb&_~w+lEP#t4#ME z**lkQ{e@#SH*_3?=a)XdY|*?~$zSogMt|fM#pkZq6vZQ$#T3K~J7rF!#vBZN#5mFQ z#DWv^51#WC4RGP)d*`^Y*K$ol=>0#XSlWh*V z*BlbBxw@18WxrsEVXx$#1KukPCo1lcICkG%>Hmj!yubV8@4wuuVzlAR+Jvb2*Kb&# zIS`e;zL2Z-#qn4TpNE$F7WV#+aQG6tA?11E+s`?(@{d2-lelL>VazuR`}7sF&HBFU zN*~jfJnsAV^1JF=7TLC!t9&1`-+jO0_3_WelE>dh#GTu~XRUbN^MwDaXp^4lLC2Q; z%=~VfdH>PxCn{&G&sm@Io?L$8{P()~%$MJn*3@15|8UFs%1c#dXlYA)rqn(QU=jym z9$4Bc&C4bxS?K`vfPn8rYrn$|5-rJRntJz2oH4eM5prVE5D{ZB5ai`_G4U`dv1BM< z)6!DXbKsOM`QjlWB2vKg&e2);*uAS2^)Dy8-#<%g}Wtc2UIu?ip*d$PPkTZrm-@Bg*!n|NAkJu>wGVDCe;m0 zrxqlwS=*!)!E749{<ixG-?|^Fz$B_)_JY@6^K+Tz=iO6O+o#;!mh-1m=Txo~Te{7o=QB1v zZ`t%)_>`T{sVes=f5S9in`TzrT;gb!sgZY~V1xVNpQi7>$p)5*2bTped!x84XSH8s zNK&r-decu)=Ig&^XTFt3Ek!zCsx^Vi7I7dJf`vY~6e-UyN-54vslb=DK_$t9G)PIp z>(jqRp?BRUsSWQq_Q`OvADXv8RfeOR-y%)(hf47O#x25?|LP{k zZ8|<@2)sS9m)9+T!R_Jaz2^4?ycT=#EHG$eoZ_|A$#wCPMIxQNYaZ$cYD|46(e=CJ zd4R;VkerUc0$+8XT`N#q)Rpu9A$z1;my+?DjT+*HH{RdAADg7bdt14R|Ck%gx5pOe zp6?CtW@M6M##O^fKpep!!0^@)#Dvy&tdRN+t&V~ig{!uM8O6Y`q|qK`6jI#>G!sj` z2Xh|wS`FFE)i5(r>p0?!MJ>>fjb&$s`Wjxm;WH88dDKjbY+@@5)I>yb24`8q=3-_} zWOJXw%tg+sKtr*%N+6LA3suzIhHPjiD~4l3L-4s2SL#PLRF4hWP*7gLWg;t3B?GYW N#KABJ=+*~d9sp?rIfMWJ diff --git a/python/python/tests/test_fts.py b/python/python/tests/test_fts.py index 5fa64c14e..614d81185 100644 --- a/python/python/tests/test_fts.py +++ b/python/python/tests/test_fts.py @@ -116,8 +116,7 @@ def lindera_ipadic(language_model_home): config_path.write_text( "segmenter:\n" ' mode: "normal"\n' - " dictionary:\n" - f' path: "{extracted_model.resolve().as_posix()}"\n', + f' dictionary: "{extracted_model.resolve().as_posix()}"\n', encoding="utf-8", )