|
124 | 124 | "- PyTorch Sentence transformers: `{'smpnet','st5','sdistilroberta','sminilm','sent_glove'}`\n", |
125 | 125 | "- PyTorch Word transformers: `{'bert', 'distilbert', 'roberta', 'xlnet', 'albert'}`\n", |
126 | 126 | "\n", |
| 127 | + "Custom word or sentence embedding models can be used by passing a file path or Hugging Face model identifier as `vectorizer`, together with the corresponding `custom_pretrained_model` argument to `emb.build_blocks`:\n", |
| 128 | + "- Custom Sentence transformers: `vectorizer='model_name'` and `emb.build_blocks(..., custom_pretrained_model='sentence')`\n", |
| 129 | + "- Custom Word transformers: `vectorizer='model_name'` and `emb.build_blocks(..., custom_pretrained_model='word')`\n", |
| 130 | + "\n", |
127 | 131 | "## FAISS\n", |
128 | 132 | "\n", |
129 | 133 | "faiss.IndexIVFFlat is an implementation of an inverted file index with coarse quantization. This index is used to efficiently search for nearest neighbors of a query vector in a large dataset of vectors. Here's a brief explanation of the parameters used in this index:\n" |
|
11542 | 11546 | 0.041863806545734406, |
11543 | 11547 | -0.19797062873840332, |
11544 | 11548 | 0.08422613888978958, |
11545 | | - -0.0004040927451569587, |
| 11549 | + -4.040927451569587E-4, |
11546 | 11550 | 0.10142297297716141, |
11547 | 11551 | -0.1592729687690735, |
11548 | 11552 | -0.13892339169979095, |
|
12278 | 12282 | 0.01203717477619648, |
12279 | 12283 | 0.03730224072933197, |
12280 | 12284 | 0.00999721884727478, |
12281 | | - -0.0000967714368016459, |
| 12285 | + -9.67714368016459E-5, |
12282 | 12286 | -0.0012333603808656335, |
12283 | 12287 | 0.0049127815291285515, |
12284 | 12288 | -0.042411092668771744, |
|
12326 | 12330 | -0.1373370885848999, |
12327 | 12331 | -0.09738717973232269, |
12328 | 12332 | -0.08944021910429001, |
12329 | | - -0.000026221718144370243, |
| 12333 | + -2.6221718144370243E-5, |
12330 | 12334 | 0.1785321682691574, |
12331 | 12335 | -0.14823342859745026, |
12332 | 12336 | 0.29911166429519653, |
|
12496 | 12500 | -0.15336649119853973, |
12497 | 12501 | -0.17148637771606445, |
12498 | 12502 | -0.04576775059103966, |
12499 | | - -0.0002886982692871243, |
| 12503 | + -2.886982692871243E-4, |
12500 | 12504 | 0.05859009176492691, |
12501 | 12505 | 0.02274763211607933, |
12502 | 12506 | -0.21441605687141418, |
|
12794 | 12798 | 0.020745988935232162, |
12795 | 12799 | -0.3763636648654938, |
12796 | 12800 | -0.39480143785476685, |
12797 | | - 0.0006196317262947559, |
| 12801 | + 6.196317262947559E-4, |
12798 | 12802 | -0.3080458641052246, |
12799 | 12803 | 0.05050341784954071, |
12800 | 12804 | 0.04591885954141617, |
|
14196 | 14200 | -0.23650690913200378, |
14197 | 14201 | -0.2087535709142685, |
14198 | 14202 | -0.2256527990102768, |
14199 | | - -0.0006704668630845845, |
| 14203 | + -6.704668630845845E-4, |
14200 | 14204 | -0.23260481655597687, |
14201 | 14205 | 0.059237588196992874, |
14202 | 14206 | 0.05719619616866112, |
|
14286 | 14290 | 0.10674760490655899, |
14287 | 14291 | -0.058976732194423676, |
14288 | 14292 | 0.09496849775314331, |
14289 | | - 0.00004359266677056439, |
| 14293 | + 4.359266677056439E-5, |
14290 | 14294 | -0.22975105047225952, |
14291 | 14295 | -0.27638518810272217, |
14292 | 14296 | 0.09805252403020859, |
|
14691 | 14695 | -0.23680473864078522, |
14692 | 14696 | -0.07355748116970062, |
14693 | 14697 | -0.2165745049715042, |
14694 | | - 0.0005726073868572712, |
| 14698 | + 5.726073868572712E-4, |
14695 | 14699 | -0.07698024809360504, |
14696 | 14700 | 0.054467570036649704, |
14697 | 14701 | 0.3693055808544159, |
|
14762 | 14766 | -0.034802526235580444, |
14763 | 14767 | 0.12485354393720627, |
14764 | 14768 | 0.20356221497058868, |
14765 | | - -0.0005281756748445332, |
| 14769 | + -5.281756748445332E-4, |
14766 | 14770 | 0.09996781498193741, |
14767 | 14771 | 0.067182257771492, |
14768 | 14772 | -0.2062978595495224, |
|
14936 | 14940 | 0.32058626413345337, |
14937 | 14941 | -0.3016047179698944, |
14938 | 14942 | -0.08911110460758209, |
14939 | | - -0.0007734508835710585, |
| 14943 | + -7.734508835710585E-4, |
14940 | 14944 | -0.07933899015188217, |
14941 | 14945 | -0.29577797651290894, |
14942 | 14946 | -0.3050692677497864, |
|
15181 | 15185 | -0.2573504149913788, |
15182 | 15186 | 0.03609131649136543, |
15183 | 15187 | -0.0062813530676066875, |
15184 | | - 0.00045815910561941564, |
| 15188 | + 4.5815910561941564E-4, |
15185 | 15189 | 0.14266984164714813, |
15186 | 15190 | 0.10829097777605057, |
15187 | 15191 | 0.13612718880176544, |
|
15607 | 15611 | -0.28111472725868225, |
15608 | 15612 | 0.20452271401882172, |
15609 | 15613 | 0.08420056104660034, |
15610 | | - 0.0007678090478293598, |
| 15614 | + 7.678090478293598E-4, |
15611 | 15615 | -0.20812328159809113, |
15612 | 15616 | -0.3826219141483307, |
15613 | 15617 | -0.05620969459414482, |
|
43579 | 43583 | 0.04186234250664711, |
43580 | 43584 | -0.1979692131280899, |
43581 | 43585 | 0.08422474563121796, |
43582 | | - -0.00040560279740020633, |
| 43586 | + -4.0560279740020633E-4, |
43583 | 43587 | 0.101422019302845, |
43584 | 43588 | -0.15927384793758392, |
43585 | 43589 | -0.1389235258102417, |
|
44315 | 44319 | 0.012037341482937336, |
44316 | 44320 | 0.03730267286300659, |
44317 | 44321 | 0.009998459368944168, |
44318 | | - -0.00009480538574280217, |
| 44322 | + -9.480538574280217E-5, |
44319 | 44323 | -0.0012314494233578444, |
44320 | 44324 | 0.0049147047102451324, |
44321 | 44325 | -0.042409781366586685, |
|
44363 | 44367 | -0.13733446598052979, |
44364 | 44368 | -0.09738475829362869, |
44365 | 44369 | -0.08943670243024826, |
44366 | | - -0.00002462582051521167, |
| 44370 | + -2.462582051521167E-5, |
44367 | 44371 | 0.1785307079553604, |
44368 | 44372 | -0.14823150634765625, |
44369 | 44373 | 0.2991122305393219, |
|
44533 | 44537 | -0.15336599946022034, |
44534 | 44538 | -0.1714865267276764, |
44535 | 44539 | -0.045769669115543365, |
44536 | | - -0.0002892519987653941, |
| 44540 | + -2.892519987653941E-4, |
44537 | 44541 | 0.058590117841959, |
44538 | 44542 | 0.022746196016669273, |
44539 | 44543 | -0.21441666781902313, |
|
44831 | 44835 | 0.02074439823627472, |
44832 | 44836 | -0.37636175751686096, |
44833 | 44837 | -0.39480140805244446, |
44834 | | - 0.0006176820024847984, |
| 44838 | + 6.176820024847984E-4, |
44835 | 44839 | -0.3080475628376007, |
44836 | 44840 | 0.050506748259067535, |
44837 | 44841 | 0.04591672495007515, |
|
45800 | 45804 | 0.38535815477371216, |
45801 | 45805 | 0.07165347784757614, |
45802 | 45806 | 0.2231462001800537, |
45803 | | - 0.0009984212229028344, |
| 45807 | + 9.984212229028344E-4, |
45804 | 45808 | 0.2918051481246948, |
45805 | 45809 | 0.28693827986717224, |
45806 | 45810 | -0.09961967915296555, |
|
46232 | 46236 | -0.23650597035884857, |
46233 | 46237 | -0.20875486731529236, |
46234 | 46238 | -0.22565750777721405, |
46235 | | - -0.0006674157339148223, |
| 46239 | + -6.674157339148223E-4, |
46236 | 46240 | -0.23261016607284546, |
46237 | 46241 | 0.05923283472657204, |
46238 | 46242 | 0.05719119682908058, |
|
46322 | 46326 | 0.10675148665904999, |
46323 | 46327 | -0.058976758271455765, |
46324 | 46328 | 0.09496378153562546, |
46325 | | - 0.00003729849049705081, |
| 46329 | + 3.729849049705081E-5, |
46326 | 46330 | -0.22975380718708038, |
46327 | 46331 | -0.2763764262199402, |
46328 | 46332 | 0.09804049134254456, |
|
46727 | 46731 | -0.2367977499961853, |
46728 | 46732 | -0.07355692982673645, |
46729 | 46733 | -0.2165636569261551, |
46730 | | - 0.0005692781996913254, |
| 46734 | + 5.692781996913254E-4, |
46731 | 46735 | -0.07698062807321548, |
46732 | 46736 | 0.054483864456415176, |
46733 | 46737 | 0.369301974773407, |
|
46798 | 46802 | -0.03479684516787529, |
46799 | 46803 | 0.12484855204820633, |
46800 | 46804 | 0.2035500407218933, |
46801 | | - -0.0005334240850061178, |
| 46805 | + -5.334240850061178E-4, |
46802 | 46806 | 0.09996215999126434, |
46803 | 46807 | 0.06717655062675476, |
46804 | 46808 | -0.20629936456680298, |
|
46972 | 46976 | 0.3205871284008026, |
46973 | 46977 | -0.30160635709762573, |
46974 | 46978 | -0.08910681307315826, |
46975 | | - -0.0007655520457774401, |
| 46979 | + -7.655520457774401E-4, |
46976 | 46980 | -0.07933466136455536, |
46977 | 46981 | -0.2957795262336731, |
46978 | 46982 | -0.30506977438926697, |
|
47217 | 47221 | -0.25735044479370117, |
47218 | 47222 | 0.03609400615096092, |
47219 | 47223 | -0.00628046365454793, |
47220 | | - 0.0004585284332279116, |
| 47224 | + 4.585284332279116E-4, |
47221 | 47225 | 0.14267142117023468, |
47222 | 47226 | 0.10829322040081024, |
47223 | 47227 | 0.13612817227840424, |
|
47643 | 47647 | -0.2811163365840912, |
47644 | 47648 | 0.20452405512332916, |
47645 | 47649 | 0.08419119566679001, |
47646 | | - 0.0007738231215626001, |
| 47650 | + 7.738231215626001E-4, |
47647 | 47651 | -0.20812755823135376, |
47648 | 47652 | -0.3826282024383545, |
47649 | 47653 | -0.05621104687452316, |
|
47889 | 47893 | -0.19475585222244263, |
47890 | 47894 | -0.28821855783462524, |
47891 | 47895 | -0.295050710439682, |
47892 | | - -0.00009316201612818986, |
| 47896 | + -9.316201612818986E-5, |
47893 | 47897 | 0.11140735447406769, |
47894 | 47898 | 0.09493596851825714, |
47895 | 47899 | -0.051914915442466736, |
|
48251 | 48255 | 0.2557325065135956, |
48252 | 48256 | 0.29231905937194824, |
48253 | 48257 | -0.15225599706172943, |
48254 | | - -0.0006214584573172033, |
| 48258 | + -6.214584573172033E-4, |
48255 | 48259 | 0.04559261351823807, |
48256 | 48260 | 0.37871798872947693, |
48257 | 48261 | 0.2513127326965332, |
|
48793 | 48797 | -0.08106150478124619, |
48794 | 48798 | -0.0757635086774826, |
48795 | 48799 | -0.0913897454738617, |
48796 | | - -0.000560691230930388, |
| 48800 | + -5.60691230930388E-4, |
48797 | 48801 | -0.22720053791999817, |
48798 | 48802 | 0.21542513370513916, |
48799 | 48803 | -0.05549247935414314, |
|
48890 | 48894 | -0.17256703972816467, |
48891 | 48895 | -0.22397547960281372, |
48892 | 48896 | -0.21700340509414673, |
48893 | | - 0.0004682873550336808, |
| 48897 | + 4.682873550336808E-4, |
48894 | 48898 | 0.15235066413879395, |
48895 | 48899 | -0.20267672836780548, |
48896 | 48900 | 0.16648273169994354, |
|
49655 | 49659 | 0.12497597932815552, |
49656 | 49660 | -0.09104467183351517, |
49657 | 49661 | 0.21928001940250397, |
49658 | | - 0.00009569602116243914, |
| 49662 | + 9.569602116243914E-5, |
49659 | 49663 | -0.0020389629062265158, |
49660 | 49664 | -0.16811877489089966, |
49661 | 49665 | 0.017217257991433144, |
|
0 commit comments