Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Empty matched_tokens when synonyms matched #1751

Open
Ku3mi41 opened this issue May 24, 2024 · 0 comments
Open

Empty matched_tokens when synonyms matched #1751

Ku3mi41 opened this issue May 24, 2024 · 0 comments

Comments

@Ku3mi41
Copy link

Ku3mi41 commented May 24, 2024

Description

`matched_tokens` is empty when a synonym is matched. The first letters of the matched word are replaced by an empty match, so they simply disappear from the highlighted text.

"highlight": {
	"title": {
		"matched_tokens": [
			""
		],
		"snippet": "Вспомогательные <mark></mark>етоды для работы с операциями ProcessFlow",
		"value": "Вспомогательные <mark></mark>етоды для работы с операциями ProcessFlow"
	}
}

Steps to reproduce

Schema
```json
{ "name": "guru_data6", "fields": [ { "name": "title", "type": "string", "facet": false, "optional": false, "index": true, "sort": true, "infix": false, "locale": "ru", "stem": true }, { "name": "author", "type": "string", "facet": false, "optional": true, "index": false, "sort": false, "infix": false, "locale": "ru", "stem": false }, { "name": "description", "type": "string[]", "facet": false, "optional": false, "index": true, "sort": false, "infix": false, "locale": "ru", "stem": false }, { "name": "type", "type": "string", "facet": true, "optional": false, "index": true, "sort": false, "infix": false, "locale": "ru", "stem": false }, { "name": "website", "type": "string", "facet": false, "optional": true, "index": false, "sort": false, "infix": false, "locale": "", "stem": false }, { "name": "publication_date", "type": "int32", "facet": false, "optional": true, "index": false, "sort": false, "infix": false, "locale": "", "stem": false }, { "name": "embedding", "type": "float[]", "facet": false, "optional": false, "index": true, "sort": false, "infix": false, "locale": "", "embed": { "from": [ "title", "description" ], "model_config": { "model_name": "ts/multilingual-e5-base" } }, "hnsw_params": { "M": 16, "ef_construction": 200 }, "num_dim": 768, "stem": false, "vec_dist": "cosine" }, { "name": "synced", "type": "bool", "facet": false, "optional": true, "index": true, "sort": false, "infix": false, "locale": "", "stem": false }, { "name": "selection_readable_ids", "type": "string[]", "facet": false, "optional": true, "index": true, "sort": false, "infix": false, "locale": "ru", "stem": false } ], "default_sorting_field": "", "enable_nested_fields": false, "symbols_to_index": [ "+", "_", "#", "&", "%", "?" ], "token_separators": [] }
```
Data ```json [ { "author": "ЦК .NET", "description": [ "Область применения и практическая ценность Решение может применяться в проекте NoName и других проектах на КПИ. Реализовано в виде .NET-библиотек. Используется для упрощения реализации типовых автоматических операций процессов ProcessFlow КПИ. Обеспечивает автоматизацию следующих сценариев: чтение параметров процесса и передачу параметров между операциями; запуск бизнес-логики автоматической операции с автоматической обработкой ошибок; ограниченное количество повторных запусков процесса в случае ошибки; протоколирование ошибок и прикладных сообщений; запуск операции в эксклюзивном режиме (единственный одновременно работающий экземпляр в рамках указанного контекста)." ], "embedding": [ 0.41903531551361084, 0.2947993576526642, -0.2216949760913849, -0.019089363515377045, -0.0003124054055660963, -0.3878582715988159, -0.13760031759738922, -0.10092748701572418, 0.17418797314167023, 0.25963059067726135, -0.42735543847084045, 0.058903466910123825, 1.3473308086395264, 0.1188976988196373, -0.21518877148628235, -0.5083199739456177, 0.429482102394104, -0.36568960547447205, 0.31955686211586, -0.523123025894165, 0.006062449421733618, -0.4151917099952698, 0.5499478578567505, 0.2617396116256714, 0.3967045247554779, -0.3491171896457672, 0.3104780912399292, 0.30126649141311646, -0.11653715372085571, 0.3764599561691284, 0.3187389671802521, -0.3037787079811096, 0.3848152160644531, 0.16959761083126068, 0.3431411683559418, 0.3704778850078583, -0.17892341315746307, -0.31347426772117615, 0.2764337360858917, 0.05075032636523247, 0.28042230010032654, 0.2529549300670624, 0.4535100758075714, -0.18175798654556274, 0.370868057012558, 0.019136276096105576, 0.45960891246795654, 0.048737481236457825, -0.12797653675079346, -0.34415945410728455, 0.2451990842819214, 0.2760298550128937, 0.27947893738746643, 0.09594414383172989, -0.2013443112373352, -0.44333988428115845, 0.1844104677438736, 0.4559485912322998, -0.487687885761261, 
0.4625944197177887, 0.20689450204372406, 0.5598936676979065, -0.28016525506973267, 0.06945764273405075, 0.11565692722797394, -0.4034501910209656, 0.5042866468429565, -0.008455991744995117, -0.10757344961166382, -0.16502664983272552, 0.2028828263282776, -0.27564284205436707, 1.234086275100708, -0.7085610032081604, -0.44571036100387573, 0.21523815393447876, -0.33980870246887207, -0.05866270512342453, 0.00844547338783741, -0.3544773459434509, 0.3717615604400635, 0.05762495845556259, 0.020793437957763672, 0.42422565817832947, -0.04394996166229248, -0.12485601007938385, -0.30652984976768494, 0.3463934063911438, 0.18091259896755219, 0.40206506848335266, 0.37051036953926086, -0.2669210135936737, -0.46156150102615356, 0.4112643003463745, 0.3781168758869171, 0.4283016622066498, 0.33554723858833313, -0.03713853284716606, 0.21715763211250305, -0.2565409541130066, -0.14815257489681244, -0.8405080437660217, -0.3060411810874939, -0.35953328013420105, -0.858472466468811, -0.23905374109745026, -0.018690384924411774, -0.3927989602088928, 0.2742723226547241, -0.6221187114715576, -0.36534979939460754, 0.6489103436470032, 0.3644448220729828, -0.24714510142803192, 0.13856863975524902, -0.4691120982170105, 0.6479092836380005, -0.4327823519706726, -0.19020017981529236, -0.44916725158691406, -0.44297102093696594, 0.22936956584453583, -0.27986007928848267, -0.4272363781929016, 0.4046412408351898, -0.17547622323036194, 0.39192458987236023, -0.06298153102397919, 0.3082367479801178, -0.8422616720199585, -0.22075249254703522, -0.5982853770256042, 0.28352826833724976, 0.08801016956567764, -0.28181830048561096, 0.2792869210243225, 0.7048195004463196, 0.23829612135887146, -0.08879301697015762, -0.10089676082134247, 0.2915865182876587, -0.4141574800014496, -0.037012822926044464, 0.2056417316198349, 0.1991194784641266, -0.634017825126648, 0.34219494462013245, 0.12788285315036774, -0.5035863518714905, 0.2501996159553528, 0.43081313371658325, 0.0547359362244606, -0.502253532409668, 
-0.12694963812828064, 0.32975566387176514, -0.07594045996665955, -0.4674229919910431, -0.057510729879140854, -0.05422244593501091, 0.06742505729198456, 0.26046496629714966, -0.031940706074237823, 0.41519537568092346, -0.2933230996131897, 0.6399680376052856, -0.07997147738933563, -0.4087536931037903, 0.09967352449893951, -0.600504457950592, -0.40041419863700867, 0.013245740905404091, -0.45415401458740234, -0.9650384783744812, 0.1605059951543808, 0.12974652647972107, -0.08873924612998962, -0.4141572117805481, -0.29689982533454895, 0.294988751411438, -0.08406643569469452, -0.5106198191642761, -0.034105103462934494, -0.35225290060043335, 0.26681074500083923, 0.09540796279907227, 0.2592088580131531, -0.35876384377479553, -0.38279101252555847, 0.3393508791923523, -0.16053812205791473, -0.21201393008232117, 0.6803915500640869, 0.36252090334892273, -0.22437754273414612, 0.07704644650220871, 0.2540169060230255, 0.20594672858715057, -0.04660394787788391, -0.30043160915374756, -0.3779967725276947, 0.054488733410835266, -0.0869474858045578, 0.045123688876628876, 0.1347946971654892, 0.2043357789516449, -0.3915671408176422, 0.29942989349365234, 0.562964677810669, 0.13987264037132263, 0.46240198612213135, -0.2949143350124359, 0.6398496627807617, -0.3134642243385315, -0.15388227999210358, 0.09083911031484604, -0.479992151260376, 0.4269832372665405, 0.29689857363700867, -0.21989622712135315, 0.26964735984802246, 0.367217481136322, -0.7629056572914124, 0.6086081266403198, 0.3476240336894989, 0.1365099400281906, 0.07161955535411835, 0.11942959576845169, -0.061079345643520355, 0.04365915060043335, 0.5355948209762573, 0.16872958838939667, 0.4960315525531769, -0.288119375705719, 0.5902898907661438, -0.019921164959669113, -0.06469420343637466, 0.2050582766532898, 0.1613631695508957, -0.3890109062194824, -0.6644212007522583, -0.30794796347618103, -0.05628543347120285, 0.20818448066711426, -0.24083200097084045, 0.20302622020244598, -0.5203245878219604, -0.5828692317008972, 
0.2220071703195572, -0.6706073880195618, 0.5155274868011475, 0.15780586004257202, -0.4871072471141815, 0.27644869685173035, -0.3554771840572357, 0.3962579071521759, 0.1950732171535492, -1.0519007444381714, 0.058315277099609375, 0.33363622426986694, -0.2854444980621338, -0.18084606528282166, -0.5699899196624756, -0.052419908344745636, -0.06833101809024811, 0.5727425217628479, -0.24237953126430511, 0.5385857224464417, -0.3105829954147339, -0.14825168251991272, -0.21065481007099152, -0.00015378347598016262, -0.43046143651008606, -0.3256776034832001, 0.048057347536087036, 0.019440028816461563, -0.153400257229805, -0.09230044484138489, 0.033132754266262054, -0.4766351282596588, -0.09581626951694489, -0.1342257261276245, 0.8347904086112976, -0.9049840569496155, -0.17989376187324524, -0.35009366273880005, 0.16221387684345245, -0.826106607913971, -0.17478631436824799, -0.6457303762435913, 0.15670610964298248, 0.5014235973358154, 0.23518037796020508, -0.36122575402259827, -0.22882230579853058, 0.5354677438735962, 0.3053086996078491, 0.09763763844966888, -0.1906307190656662, -0.39454296231269836, -0.45282822847366333, -0.059934139251708984, -0.3002924919128418, 0.6589397192001343, -0.3843908905982971, -0.17304126918315887, 0.1475815623998642, 0.8014636039733887, 0.11543800681829453, -0.610419750213623, 0.1445508599281311, -0.3317123055458069, 0.004496673122048378, -0.14291538298130035, 0.21656522154808044, 0.14095304906368256, -0.008210157975554466, 0.15165728330612183, 0.7594878673553467, -0.19857589900493622, 0.20781297981739044, -0.1804226040840149, 0.4597885012626648, -0.5488624572753906, -0.536964476108551, 0.5223797559738159, -0.019600188359618187, 0.07890485972166061, 0.24637368321418762, 0.19196946918964386, -0.002268910873681307, -0.12392868846654892, 0.40915384888648987, 0.27402570843696594, 0.2700900137424469, -0.8812499046325684, 0.21296043694019318, -0.5582321286201477, -0.6242333054542542, 0.2591637670993805, 0.2017979919910431, -0.26973673701286316, 
0.5164321660995483, 0.16235721111297607, 0.20629549026489258, 0.5701379179954529, -0.6032457947731018, -0.19471512734889984, -0.19419971108436584, -0.49861472845077515, 0.18528279662132263, 0.3705073595046997, -0.47995948791503906, 0.27442654967308044, 0.23058173060417175, -0.18771977722644806, 0.2906602621078491, 0.1685466319322586, 0.29936903715133667, -0.26744335889816284, -0.008963962085545063, -0.30146700143814087, 0.4312657415866852, 0.05468887835741043, -0.21554270386695862, 0.1412978321313858, 0.07750192284584045, -0.3687553405761719, 0.23594234883785248, 0.5578093528747559, -0.053059857338666916, 1.0040816068649292, 0.4605634808540344, -0.22153878211975098, -0.19016678631305695, 0.31749001145362854, -0.18276044726371765, 0.5661104917526245, 0.10362952202558517, -0.013654154725372791, 0.33269721269607544, 0.49437347054481506, 0.3529300093650818, 0.13817627727985382, 0.15752892196178436, -0.42120498418807983, 0.3219049870967865, 0.4221370816230774, -1.3751661777496338, 0.20832176506519318, -0.15642079710960388, -0.019159317016601562, -0.10149957239627838, -0.07526232302188873, 0.38308948278427124, 0.41983848810195923, -0.3396340310573578, -0.04124356061220169, -0.2144632637500763, 0.43553829193115234, -0.49572786688804626, 0.45492881536483765, 0.2947790026664734, -0.12112989276647568, 0.42661333084106445, 0.049740977585315704, -0.1851181536912918, 0.23058517277240753, 0.6559059619903564, -0.13382688164710999, -0.40951430797576904, 0.5289642214775085, -0.7115406394004822, 0.49757057428359985, 0.3805500268936157, 0.15487326681613922, -0.2843770682811737, -0.21611878275871277, 0.1735387146472931, 0.24252046644687653, 0.09578035771846771, -0.456052303314209, 0.45893269777297974, 0.31234216690063477, -0.19636787474155426, 0.0817960649728775, -0.7260170578956604, -0.06771581619977951, -0.02330039069056511, 0.34700968861579895, -0.1769697666168213, 0.14113923907279968, -0.30407553911209106, 0.1658673733472824, -0.02264910377562046, 0.11723387241363525, 
-0.34386786818504333, 0.031192364171147346, 0.30862972140312195, 0.08228828758001328, 0.07565971463918686, 0.11234541982412338, -0.013223767280578613, 0.3752405047416687, -0.30098557472229004, -0.31833794713020325, 0.047820836305618286, -0.1283988505601883, 0.23077701032161713, -0.3860223591327667, -0.032193560153245926, 0.038372647017240524, -0.03908997029066086, 0.04088144749403, -0.129859060049057, 0.42381542921066284, -0.2915990650653839, 0.5980413556098938, -0.12895876169204712, 0.2096407413482666, -1.243570327758789, 0.3429144322872162, 0.513032853603363, -0.011483872309327126, -0.01610761135816574, -0.18835406005382538, -0.41721948981285095, -0.1332818865776062, -0.6112943291664124, 0.536255955696106, -0.094984270632267, -0.32747992873191833, -0.35803407430648804, 0.2638532221317291, 0.2925602197647095, 0.12261988967657089, 0.4966830909252167, 0.30903610587120056, 0.45810291171073914, 0.3089650273323059, -0.24522818624973297, 0.05901443213224411, 0.1471199244260788, 0.1437862515449524, 0.2651997208595276, 0.5310576558113098, 0.3501899838447571, -0.8802953362464905, 0.13864107429981232, 0.2072814702987671, -0.2843438386917114, -0.3494732975959778, 0.4994352459907532, 0.3256068825721741, 0.03617929667234421, -0.21046796441078186, -0.17180228233337402, -0.34546327590942383, -0.518719494342804, 0.39688679575920105, 0.18582625687122345, -0.16331836581230164, -0.1754811406135559, -0.5048746466636658, 0.23620028793811798, -0.22855855524539948, 0.06145492196083069, -0.27321887016296387, 0.4265781342983246, 0.32752034068107605, -0.43398764729499817, 1.780234932899475, -0.27593496441841125, -0.11565414816141129, -0.025359200313687325, 0.07280123233795166, 0.5460150837898254, -0.22980256378650665, 0.24058887362480164, 0.14993277192115784, -0.3225025236606598, 0.28327006101608276, -0.024531370028853416, -0.39141735434532166, -0.2615518271923065, -0.0024463613517582417, -0.5242587924003601, 0.2157103419303894, -0.2926061153411865, 0.36307811737060547, 
0.08334649354219437, 0.48141181468963623, -0.4680572748184204, 0.17233653366565704, -0.5981602668762207, -0.7008752822875977, 0.2882472574710846, -0.2361663430929184, -0.3189001977443695, 0.5088678002357483, -0.06627834588289261, 0.3630504310131073, -0.2501903772354126, 0.13583219051361084, -0.02376312017440796, 0.05053636059165001, -0.24981506168842316, 0.1712590456008911, -0.03607219085097313, -0.04756901413202286, -0.14107383787631989, 0.08505024760961533, -0.4341421127319336, -0.3075927197933197, 0.13982436060905457, -0.351220965385437, 0.6118596792221069, 0.0685606598854065, -0.09057459980249405, -0.042288582772016525, -0.2825644612312317, -0.0247552040964365, -0.4349459409713745, 0.049743082374334335, 0.32608747482299805, 0.03914905712008476, 0.2046733796596527, 0.12778162956237793, -0.06328822672367096, -0.17993208765983582, 0.6717338562011719, -0.5645511150360107, 0.06447375565767288, 0.22136731445789337, -0.4804987609386444, 0.2874006927013397, 0.16254620254039764, -0.3663550317287445, 0.06541944295167923, 0.28663942217826843, 0.22186073660850525, -0.768125057220459, -0.06791763752698898, -0.15354342758655548, 0.12846925854682922, 0.6454244256019592, 0.17939409613609314, 0.1552404761314392, 0.18566444516181946, -2.019766330718994, 0.027658572420477867, -0.0637126937508583, -0.09286469221115112, 0.2838715612888336, 0.33783239126205444, 0.5078136324882507, -0.051721569150686264, 0.08461225777864456, 0.42153200507164, 0.3248494267463684, -0.6534098982810974, 0.1641954779624939, -0.38245970010757446, -0.3798925578594208, 0.02551165223121643, 0.38943853974342346, -0.12519389390945435, 0.09903798997402191, 0.48780831694602966, -0.01811789534986019, 0.4783611595630646, -0.3746334910392761, -0.01810513250529766, -0.6264858245849609, -0.45440128445625305, -0.4343136250972748, 0.555066704750061, 0.08582336455583572, 0.2540826201438904, 0.4111096262931824, -0.08068689703941345, 0.1395426243543625, 0.32896533608436584, -0.3859056234359741, -0.2721859812736511, 
0.13537578284740448, 0.18079672753810883, -0.759847104549408, 0.2789669930934906, 0.2472856044769287, -0.46972501277923584, -0.6973586082458496, 0.3042770028114319, 0.17083752155303955, 0.46674513816833496, 0.2711435556411743, 0.464407742023468, -0.01563413441181183, 0.17806695401668549, 0.5727675557136536, 0.03561520576477051, -0.920479416847229, 0.13709349930286407, -0.1599246859550476, 0.4253135323524475, 0.12926426529884338, -0.0933178961277008, 0.49980974197387695, -0.057441383600234985, 0.16782133281230927, 0.20482702553272247, -0.2353064864873886, 0.3457759916782379, -0.15007691085338593, 0.052155692130327225, 0.6054020524024963, -0.10240575671195984, -0.10275417566299438, -0.008768334053456783, 0.14308400452136993, -0.2845083475112915, 0.211418017745018, -0.09427820891141891, 0.2193147987127304, -0.4397425353527069, 0.1491849422454834, -0.2856934070587158, -0.30541592836380005, 0.32858195900917053, -0.0344611331820488, -0.2002153843641281, -0.032999437302351, 0.4174789786338806, -0.10320640355348587, -0.4835611879825592, -0.643187403678894, 0.2904703617095947, 0.2849770784378052, 0.45970436930656433, -0.4671192169189453, -0.5095667839050293, 0.22216114401817322, -0.47701284289360046, 0.3445839285850525, -0.3693062663078308, 0.05005593225359917, 0.2819678783416748, 0.3344113230705261, -0.04309134930372238, -0.1546379029750824, -0.09744458645582199, -0.12810984253883362, 0.12362393736839294, 0.12127415090799332, -0.5291693806648254, -0.9505281448364258, 0.28628310561180115, -0.17922843992710114, -0.5370204448699951, 0.14971207082271576, 0.019386261701583862, 0.5289759039878845, -0.3966006636619568, 0.22986742854118347, -0.6282252669334412, 0.11583985388278961, -0.2901017367839813, -0.07168975472450256, -0.21911516785621643, -0.07238052785396576, -0.515209972858429, 0.20845729112625122, 0.023215314373373985, 0.857803463935852, -0.09444469213485718, -0.03277201950550079, -0.29556530714035034, -0.01524239033460617, 0.13535457849502563, -0.7292568683624268, 
-0.4850911498069763, -0.24420325458049774, -0.23027217388153076, -0.4123331606388092, 0.01698797382414341, 0.13037364184856415, -0.02268531173467636, 0.2937948405742645, 0.2277262955904007, 0.32824698090553284, -0.9304085373878479, -0.03990575298666954, 0.26207268238067627, -0.18674127757549286, 0.044798463582992554, -0.13961757719516754, -0.13805541396141052, -0.3100256025791168, -0.017231127247214317, -0.17434817552566528, -0.6074383854866028, -0.20214693248271942, -0.1881837546825409, -0.38639122247695923, 0.4495062828063965, 0.05972200632095337, 0.37135258316993713, 0.3414979875087738, 0.0039483229629695415, -0.23661993443965912, -0.7765422463417053, 0.21247026324272156, 0.07906066626310349, 0.4493262767791748, 0.01331324689090252, -0.18114931881427765, -0.0745924636721611, 0.06377062946557999, 0.3139767348766327, -0.6566298604011536, 0.6671550869941711, 0.3123320937156677, 0.06550060212612152, 0.6004573702812195, -0.050371795892715454, 0.353111207485199, -0.17215684056282043, -0.1702198088169098, 0.28847625851631165 ], "id": "3152f09d-d0fc-4561-bd66-8519e38fa5f5", "publication_date": 1708560000000, "selection_readable_ids": [ "rgb", "dotnet-libraries" ], "synced": false, "title": "Вспомогательные методы для работы с операциями ProcessFlow", "type": "Разработка", "website": "https://confluence.gnivc.ru/pages/viewpage.action?pageId=151663988" } ] ```
Synonyms
```json
{ "synonyms": [ { "id": "FF9gYADxR4jLP7XFxfkiU", "locale": "ru", "root": "", "synonyms": [ "алгоритм", "метод" ] } ] }
```
Search
```json
{"searches":[{"exhaustive_search":true,"query_by":"title,description,type,selection_readable_ids","highlight_full_fields":"title,description,type,selection_readable_ids","collection":"guru_data6","q":"алгоритм","facet_by":"type","max_facet_values":10,"page":1,"per_page":12}]}
```

Expected Behavior

The full synonym should be marked/highlighted. At the very least, no letters should be erased from the text.

Actual Behavior

`<mark></mark>етоды` is returned instead of a full-word highlight, and the leading letter "М" simply disappears.

Metadata

Typesense Version: v26 and v27.rc13 (the behavior is the same in both).

Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment
Labels
None yet
Projects
None yet
Development

No branches or pull requests

1 participant