naranor committed on
Commit
d8482d3
·
verified ·
1 Parent(s): c0a1551

Initial export with WAMP attention weights (INT8 ONNX)

Browse files
.gitattributes CHANGED
@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ model.onnx.data filter=lfs diff=lfs merge=lfs -text
37
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,71 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: setfit
3
+ license: mit
4
+ base_model: sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2
5
+ tags:
6
+ - setfit
7
+ - onnx
8
+ - attention-weights
9
+ - context-compression
10
+ - intent-classification
11
+ - multilingual
12
+ pipeline_tag: text-classification
13
+ ---
14
+
15
+ # SetFit Multilingual OVR Router (ONNX with Attentions)
16
+
17
+ This is a state-of-the-art **SetFit** model exported to **ONNX** format, trained to classify LLM tasks into three semantic categories: **Needle** (Fact Retrieval), **Reasoning** (Logic/Analysis), and **Summary** (General Recap).
18
+
19
+ The model is based on [paraphrase-multilingual-MiniLM-L12-v2](https://huggingface.co/sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2) and has been modified to expose **all 12 layers of raw attention weights**.
20
+
21
+ ## Key Features
22
+
23
+ - **3-Class Classification:** High-precision separation of intents.
24
+ - **Multilingual:** Native support for Russian, English, and 50+ other languages.
25
+ - **Attention Output:** Every inference returns one attention tensor of shape `(batch, heads, seq_len, seq_len)` per layer, for all 12 layers.
26
+ - **Dual Precision:** Both **FP32** (`model.onnx`) and **INT8 Quantized** (`model_quantized.onnx`) versions are available.
27
+ - **Optimized for CPU:** Fast ONNX inference via `onnxruntime`.
28
+
29
+ ## Classification Map
30
+ - **Label 0:** Summary (Chatter, Recaps, TL;DR)
31
+ - **Label 1:** Needle (Pinpoint facts, parameters, keys, IPs)
32
+ - **Label 2:** Reasoning (Comparison, analysis, code debugging, logical chains)
33
+
34
+ ## Project Origin
35
+
36
+ This model is a core component of the **[WAMP-proxy](https://github.com/naranor/wamp-proxy)** project, an intelligent middleware for research into LLM context optimization.
37
+
38
+ ## Quick Inference (Python)
39
+
40
+ ```python
41
+ import numpy as np
42
+ import onnxruntime as ort
43
+ from transformers import AutoTokenizer
44
+ import json
45
+
46
+ # 1. Load model and weights
47
+ session = ort.InferenceSession("model.onnx")
48
+ tokenizer = AutoTokenizer.from_pretrained(".")
49
+ with open("router_weights_setfit.json", "r") as f:
50
+ weights = json.load(f)
51
+
52
+ # 2. Prepare Input
53
+ text = "What is the database port?"
54
+ inputs = tokenizer(text, return_tensors="np")
55
+ onnx_inputs = {
56
+ "input_ids": inputs["input_ids"].astype(np.int64),
57
+ "attention_mask": inputs["attention_mask"].astype(np.int64)
58
+ }
59
+
60
+ # 3. Run
61
+ outputs = session.run(None, onnx_inputs)
62
+ embeddings = np.mean(outputs[0], axis=1) # Mean pooling (ignores attention_mask; correct only for a single, unpadded input)
63
+
64
+ # 4. Predict probabilities (LogReg Head)
65
+ scores = np.dot(embeddings, np.array(weights["coef"]).T) + weights["intercept"]
66
+ probs = np.exp(scores) / np.exp(scores).sum(axis=-1, keepdims=True) # Softmax over the class axis
67
+ print(f"Probabilities: {probs}")
68
+ ```
69
+
70
+ ## License
71
+ MIT License.
model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41615aff1c6cee874e6ba7c0901aebe3555eff8aff9e0adf64edc670c1017241
3
+ size 1229334
model.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dceef97beff1382e8880bbd42c1e182980e4b0b000eadc40ffad67c3b530bbed
3
+ size 470040064
model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9150bcebd64dfdcd9e65e0b56b6d202c1230e406785ab665066cf19f8d2b3d7b
3
+ size 118758654
router_weights_setfit.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"coef": [[0.028468068428111754, -0.030329092560622876, 0.11839902135318583, 0.0005255069812434272, -0.013119884607757752, -0.014026226971872733, 0.007324444442594766, 0.03491407303510532, -0.07437404732765014, -0.038068830805335005, -0.04021658786542993, -0.02156441409126066, 0.0011877922779839776, 0.022737072728418472, 0.09350496659354632, -0.006933523624430427, 0.054094276010350925, 0.022016309473158375, -0.031689391666502864, 0.016151102546866906, -0.147082352391899, 0.07408666813880292, -0.04513706386037447, 0.04494651016067089, 0.019177229116895504, 0.01857915159491367, 0.04727457521930594, 0.009166076527889032, -0.06291764035325231, -0.09069661619560475, -0.03389691150999527, -0.0014319660189830543, -0.054050618584639526, 0.05036706947456197, -0.018811050161414523, 0.0974229114412268, -0.03565111517800568, -0.023227978539338542, -0.03204809958000711, 0.018534198458253107, 0.03225196021543347, 0.020270947028700144, -0.047326801327934404, 0.017829836617209455, 0.0018122070211680217, -0.08139799463633503, 0.012240528220923948, -0.006353264669203491, 0.04307579659133122, 0.05909942568330559, -0.06290170426992184, 0.02501945176563773, -0.037137061370123826, 0.016794555749237855, 0.03924258360877539, -0.04651920536678997, 0.03937230285779325, 0.009892140092662986, -0.004354436302071012, -0.01575087726428614, 0.03593334850973878, -0.020805377556656676, -0.0406822202168801, 0.0933032830335355, -0.06050211463524127, 0.0014714647996070028, -0.03660089193710596, 0.044550250490291016, -0.026221792356506627, 0.025678295528986612, -0.05048312167365473, 0.03863648974724897, -0.029358909846166188, 0.08828566424073381, -0.02791456274086588, -0.0084120124989798, 0.036222191973095424, 0.004581322887289848, 0.047323438425368826, -0.018481952940685113, 0.0066073719359825, 0.01761516795917219, -0.019874986124217987, 0.003490661297095746, -0.011211676371536904, 0.012049436209615445, -0.040485628627364066, 0.12307124344842968, -0.10558321123823586, -0.024489899041898203, 
-0.03505731699449296, 0.07394323993415776, 0.08379278859938845, 0.05455858173509188, -0.033290587904585806, -0.024146516888457537, 0.030984784075565448, -0.06805424821357937, -0.07542185594630801, 0.07753584900073694, 0.04154425961935182, -0.011334953873263921, 0.034374726639336085, -0.06371870577822294, -0.005374100798035061, 0.052412707660856636, -0.0369170033740138, -0.030579961996699923, -0.008860418718939474, -0.023150031045898817, -0.0006639561390991904, -0.06868400419194337, -0.011858459369880173, -0.09634062983752696, -0.029485267172787842, 0.058379960853138284, 0.028485997649346242, -0.020067677438527054, 0.00918169112545448, 0.002254547274577785, -0.02143676560590388, 0.05027906144529946, -0.04197627971230146, -0.01794766078837946, 0.06894192829804172, -0.11818826975294919, 0.045502991307655186, 0.022655091019037964, 0.01273891722992025, 0.08517841067775253, -0.033096314566927076, 0.05599155133256565, 0.1121532026520019, 0.033390277897385925, -0.03031080804845138, -0.039580369436720865, -0.029861857574880805, -0.05501275655058246, 0.043165779476514926, -0.017274056850365826, -0.04400600015266884, 0.01078596060128262, -0.06285842844661006, -0.09757439598558894, 0.04527782910798097, 0.03562580389353336, -0.009223852266101059, -0.042212847172026106, -0.0692320984784577, -0.002436589728953866, 0.018588145085118815, 0.10806675162779622, 0.04733696823276822, -0.0027018195379594763, -0.045964491155175584, -0.03234504020927437, 0.039222322615320826, -0.03619946217493956, -0.010868900025057405, -0.021138530150772845, 0.01874735783599683, 0.009501277987951686, -0.06088787355046987, -0.0909886416722473, -0.02884230220795261, 0.023179817356730473, -0.042267469516465976, 0.015068539919620599, -0.01838652584372639, 0.009794176458255779, -0.05642455510198704, -0.023649758498786772, -0.013037702836182814, -0.0498704240486455, 0.08785120833652559, 0.02348131352152086, 0.03149747909527489, -0.03125250698565939, 0.030280016623854315, 0.014512365530449572, 
0.03300422411927791, 0.03545522354650992, -0.07674482722426548, -0.028266849717942102, -0.058849760501220906, -0.023056631986851334, 0.03396962932924641, 0.008525250304988515, 0.036033389073659224, 0.006082072198255436, -0.06131291839863628, -0.07885198671478334, -0.021708804625222657, 0.006070095534401605, -0.036623177446269306, 0.09217897112821555, -0.04073907193206177, 0.017227774026480975, -0.02644702815243245, 0.006795319525666379, 0.04787091688474401, -0.041682243414808064, 0.07213092071391497, 0.06563613441210195, 0.10905695516756345, -0.0938263570588183, 0.043562591407182785, -0.04371699700896158, 0.05538442378386121, 0.02836804642711683, -0.015306397724292502, -0.019983015244905804, 0.09318797821791319, 0.002829676593034357, 0.04291193820343903, -0.03789717759949964, 0.0272890788855013, 0.1072211703361009, -0.09305341642974543, -0.005441281736099744, 0.12538464241969438, 0.030371048018991542, 0.07555871489713163, -0.06734876197453082, 0.0820685091574704, -0.039178737596620994, -0.09532527988262286, 0.009980728343621207, 0.03465931404893548, -0.030931979160444375, 0.01859501139983911, 0.06653873527582005, -0.0885966285108659, 0.03306005802768046, -0.044791734197476514, -0.017212601440330735, -0.050791290200870656, -0.019626060720415676, -0.03962717058517083, -0.0004383312997196071, -0.02347087943624139, 0.0024821520766076196, 0.031791184900285374, 0.037726528633931264, 0.05613470585164043, 0.0626468821872141, -0.034142007245956875, 0.05241931401613148, 0.005627834111322209, 0.11810809595163338, 0.08716106613857036, -0.014458165675536967, 0.00284407888064478, 0.01903829043435574, 0.0015547821099073363, 0.03814697984263928, -0.07885633284699539, -0.0829044745166765, 0.09162555187363292, 0.031466219204050704, -0.03380467967942466, -0.11442452157827608, -0.02177813249203085, 0.022121745101519704, 0.005790768975344751, -0.07808762646651424, -0.048416256251020875, 0.004493132440690931, 0.03681503698265157, -0.07171137929006584, -0.06630943843206594, 
-0.008191165787205431, 0.003578085993634731, 0.019309663123976917, -0.05192145924522541, -0.04848759156020546, 0.024598624680475693, 0.023558872737031368, 0.015429247577405873, -0.008616738989680522, 0.042181014638446396, -0.08630233267524724, -0.00804845503785971, 0.0015552714662143462, -0.10069470518612886, -0.060891760857305376, 0.022298947238115718, -0.08002017662383952, 0.06370975199988879, 0.01652076146589003, 0.011680190743670608, 0.021015754141818443, -0.016183233132841403, -0.07682871812904571, -0.09728159980484873, -0.002465529298917037, -0.07926062750583308, 0.05799592005738833, 0.12649759076028, -0.06598309265044917, 0.0482403209273568, -0.11916430540799872, 0.030330567231406994, -0.0006416969907562122, 0.08768917336671087, 0.013118861597237077, 0.02152574698647322, -0.032641870642128715, 0.08428647378652536, 0.045434064274064406, -0.01139921882827238, 0.12748737547611788, 0.012539256952076513, 0.058684096954962225, -0.03970048961468089, -0.019768037027042072, 0.0304130388561869, 0.08041831511925009, 0.01436862458488767, -0.09658907657471488, 0.03533850187333295, 0.03112949109974117, -0.04659038133789124, -0.06413815975806156, 0.042502386049503495, 0.026702526070038167, -0.01006002156035539, -0.012556819239174023, 0.020081635875751784, -0.021817019011890218, -0.028904154700426187, -0.010979054960049929, -0.0393845988902475, 0.038584975252444545, -0.07111448477220543, 0.021619572907245366, -0.08546879863088488, -0.06658286150523766, 0.026484807146414557, -0.009580353791178723, -0.006559141177990381, 0.013784115890473386, -0.03844802889714092, 0.0275643915211318, 0.0253804347522271, 0.0005999287875547557, -0.022219847304261978, 0.020417125168864462, 0.030923961695060224, 0.07732905000543885, 0.0032810745107908117, 0.06626619014187066, -0.10533391354279745, 0.0005281939499037028, -0.0182602635831583, -0.048810728881935744, 0.10820930244352259, 0.04291835968383638, 0.10861546220306388, -0.009540288608019355, 0.008848760816972424, 0.023920888368157138, 
0.024551815384157905, 0.04041543632104804, -0.031640212507277096, -0.06499066488822318, 0.05254639294795206, -0.008160765751959698, 0.007475918241954581, 0.006399929823740314, -0.01126567887879209, -0.11684532905672622, -0.035470422320944786, 0.048630629703984816, 0.07014923421719342, -0.014281134622418316, -0.04886216627997247, 0.017397730259623836, -0.09282459494314226, 0.05427010432921443, 0.06409235328118461, 0.022868399396825077, -0.05776144885040839, 0.05907768100332862], [0.013692676056475703, 0.04653776653725488, -0.06079714806645861, -0.03296189589856605, -0.03698225792741619, 0.01703561965449279, -0.00139438593633635, -0.03110355863421009, 0.025955926103189, -0.006073796182770177, 0.04360844951012254, -0.0342503384939325, -0.015122044414139555, -0.02743659418200463, -0.09391203768736021, -0.021810454076754172, -0.02978781082476716, 0.05269706562599843, 0.1428100447616157, -0.019243799104165956, 0.1326711802499114, -0.007621170093066757, -0.01610590336717944, -0.06346176418358544, 0.05394070681169501, 0.022065304869287785, 0.010522116063741652, 0.022719732025547168, 0.01900569637521746, 0.0245139812132313, 0.054699312638196475, -0.02585197662218886, 0.06678584324361644, 0.026282569129533095, 0.08097559763070201, -0.013270072396847632, -0.00010352112684771, 0.030662345223775696, 0.04680765361116303, -0.013116140408558536, -0.015211212555734039, -0.01626585941615247, 0.009144655576378323, -0.0029216582836205604, 0.05166862836753942, 0.09287687631000777, -0.05908628972130761, 0.01940007947064009, 0.04435865447066274, -0.022125489784692448, 0.03676689519311486, 0.017153669273095057, 0.012513458001971588, 0.008924902988994262, 0.04340757848231736, -0.034900678545782444, -0.05340268408428707, 0.0014413306333575283, 0.05197626905117796, 0.027267565714894415, -0.059920524639608924, 0.025039899106209233, -0.012134844229458935, -0.05508728364986815, -0.06421615258709165, 0.0661972007496278, 0.024654645126750894, -0.07787500342312015, 0.02807817463725102, 
-0.06470135185187613, 0.018041614665490563, -0.009217384481947363, 0.05261968218382017, -0.054235719479313285, -0.014149963975550527, 0.06642378662763765, -0.03706347390652834, 0.03890431236746374, -0.07752582232102333, 0.025462604612977204, -0.008536278998530102, -0.043433810157521575, -0.005068511658508858, 0.007037662074801709, 0.04406923382443007, 0.0014493179607468205, 0.015295494433038334, -0.020599619255320008, 0.09501082893529986, -0.015673356488092278, -0.001835269590436158, -0.1047846120251335, -0.06043097003184297, -0.07964036270276617, -0.012112336709509636, -0.03241247100519289, 0.031709764500224384, 0.03980380395418874, 0.07325735096235408, -0.029612012318792826, -0.00011840026521379974, 0.03479274008899117, -0.00017366810769490592, 0.025417228454625664, -0.013162675303524706, -0.02212818864214123, 0.06212723097518164, 0.04278288440870911, 0.049028347206627305, -0.01205796016957958, -0.024621127300198994, 0.034630756543800295, -0.004507013067229732, -0.02035201175328, 0.07213836727601178, -0.0323213888888638, -0.023537791346993322, -0.02272500851208461, -0.01713698267276275, -0.02167698872773904, 0.032322709231926226, 0.0024490528571165905, 0.027881116355276767, 0.028373265737024887, -0.11845123238546632, 0.0942405827427277, -0.006624504720044075, 0.022650307633089596, 0.024102187511776, -0.03592149591989693, 0.037292127259415685, 0.02174463555009612, -0.05522367977819438, -0.017693251055040188, 0.05977716794315016, 0.012760582503948795, -0.026414205700645028, 0.0652450267848556, -0.04581511747776373, -0.04932452991871764, -0.02001026672112385, -0.06189037907671507, -0.05911677845477234, 0.008676452389168187, 0.03683247236781886, -0.0522119724429059, -0.014082966330214665, 0.03588744335151078, 0.013881628051081387, 0.01858784430827442, -0.037846621240504134, -0.06623510082741763, -0.004840029236477729, 0.09732582109229407, 0.03887699191316355, -0.00550614338102082, 0.0645124524370628, 0.049730507244954404, 0.006435675951425629, -0.028701143604256782, 
0.023021080773340516, -0.030244960735196825, 0.10938361868703975, 0.08561776649069647, -0.010287682797542625, -0.0677123702089685, 0.010731015477041844, -0.009887459279172641, 0.01606800877890118, -0.02082603214697186, 0.011556834309099307, 0.01014558860913115, -0.005442245496665186, 0.1079337718477871, -0.09748493628353666, 0.05104121361858788, 0.11792857684973679, -0.0006207539281699122, -0.06900136106385817, -0.004235115751726615, -0.12712725706553724, -0.001082149589183774, 0.04829101659415626, -0.011449974161861134, 0.024547283251788017, 0.009249999021098123, 0.027009294286620678, -0.00562213770579308, 0.051278853456553655, 0.04238248348821804, 0.02365663327908578, 0.019649112765508035, -0.002307306589835578, -0.058614934978719675, -0.017512985945448655, -0.05125350558620291, 0.002112037825853248, -0.06786260837715205, 0.005200193494488639, -0.008646849990615673, 0.020366650516547406, 0.023595564219172676, -0.06554052551333936, 0.020046743484218515, -0.07459725769620422, 0.027546275588621657, -0.0915977106158932, 0.015845090507110453, -0.07489633678358382, 0.021324915888299958, 0.06794386937767162, 0.029492333463106805, -0.021284657773236078, 0.009702034514923363, -0.01724731235949388, 0.08012453249329526, 0.0076179854938896565, -0.14372671879488838, -0.015910644267052937, 0.027059477883867467, -0.07621097097687303, -0.05518721063125731, -0.116136235896035, 0.01651986249801569, -0.009064145173330053, -0.005894699173124263, 0.05815432306475234, -0.032691467136489405, 0.0006313014294837601, -0.002240120558146687, -0.022923044683296142, 0.05335849636875492, 0.0738045964597702, -0.05925764746726707, 0.07787331753044041, 0.0009566250498372878, 0.08578990478029316, -0.07856268917522152, 0.062758183431521, 0.12505182001642914, -0.05058779528206289, -0.058212478070458575, -0.03537310232009565, 0.05469149184754396, -0.08558904603986466, -0.10701762247622916, 0.022590363388442468, -0.003820134679757611, -0.017830154820661734, -0.05208022068110576, 0.04056866619840077, 
0.03233228164052967, -0.027040486952883344, 0.01296307720777568, -0.02011619832893537, -0.043776312681704996, 0.07439621800509365, 0.09826928547318545, -0.10442283853245173, -0.05297907986815246, 0.07487693495230802, 0.009996007945637498, -0.011749995790179192, -0.02273238659767789, 0.020869455548425925, 0.06932980577596295, 0.03158212406117764, 0.09722177053181433, -0.04977160138472827, -0.02972487133800247, -0.014840799767388084, 0.030178347925603758, -0.037379799635713654, 0.025400266292205508, -0.0002378323961803202, -0.010793679169998193, -0.010509085367357838, -0.011168051467580233, 0.05792881489371608, 0.05791029394855825, -0.06924936983182792, 0.05020146680057826, 0.03468392366008778, -0.017921964349629796, 0.02535700521339616, 0.04174287701451272, 0.00491702098583368, 0.024122378639442794, -0.07406652990965364, 0.01457379466925789, -0.020142812420393705, 0.06067288965457598, -0.07725942686746681, 0.06218599242780683, 0.005137954880629072, 0.030152324751362806, 0.08170676739935259, -0.0066587486407371525, -0.08530370812601942, 0.04270445821166073, -0.02283551862561647, 0.07775574159468464, -0.003531794034211723, -0.05207321808219299, -0.03277343656844646, 0.021722556718219137, -0.10910250877038295, 0.0420194721719678, -0.019948371657595203, -0.04228784429191654, 0.03649211476495125, -0.01702386482375709, 0.024695435480273756, 0.005882488921613842, 0.07423697569099182, -0.0018007386304836914, 0.02225474073787497, -0.013413718347426471, -0.0635015635206676, -0.00507994356474185, -0.05880895386011221, -0.009389762067477705, -0.012807989727689666, 0.053836259175358996, 0.07726205951764645, -0.0064794519880366904, 0.0222814643461658, 0.022301184849275887, 0.024349309238565653, -0.00011257047389743344, 0.01579021781579335, -0.021474564798754998, -0.004664987549581238, -0.03598663422342081, 0.029780319565682983, -0.11694813452060937, 0.05195952905318724, 0.03439897002088001, -0.008470862306359307, -0.027790208435362125, -0.06628076282911745, -0.03975053969399491, 
0.07141520036360027, -0.08241731981637528, 0.04289095187234394, -0.05338572619689218, 0.000831301503233194, -0.01442625624560479, -0.0017469583475927493, -0.021208362083784463, -0.028349027131229228, -0.03631879949397976, 0.05313414804799489, -0.026158386317312644, -0.059511236349496614, 0.09792663628597172, -0.07474915249252521, -0.051215680671865944, -0.05419131612411609, -0.03023834754244367, 0.0025552121491245836, -0.01743813244742609, -0.028848768646688033, -0.03830557540086737, 0.04849686614009759, 0.07693174733968883, -0.04571403899980706, -0.03247494378280012, -0.002781436756600152, -0.007630595092642721, -0.03711713467277007, 0.0895654050443182, 0.016575360542900732, 0.005292280257850699, -0.017460601894104564, 0.04475634957436568, 0.018301126253385314, -0.08996194279295687, 0.02019148031441856, -0.051497305206179504, -0.05862713666045308, -0.02933719015850704, -0.04943317747554953, -0.036534452726273335], [-0.042160744484587516, -0.01620867397663205, -0.057601873286727195, 0.03243638891732262, 0.05010214253517396, -0.003009392682620034, -0.005930058506258446, -0.003810514400895266, 0.04841812122446114, 0.04414262698810517, -0.003391861644692649, 0.05581475258519325, 0.013934252136155584, 0.004699521453586119, 0.0004070710938138643, 0.028743977701184587, -0.024306465185583822, -0.07471337509915678, -0.11112065309511267, 0.003092696557299052, 0.014411172141987613, -0.06646549804573611, 0.061242967227553874, 0.018515254022914606, -0.07311793592859063, -0.04064445646420146, -0.0577966912830476, -0.031885808553436236, 0.04391194397803487, 0.06618263498237344, -0.02080240112820122, 0.027283942641171947, -0.012735224658976845, -0.07664963860409509, -0.06216454746928746, -0.0841528390443791, 0.035754636304853316, -0.007434366684437113, -0.014759554031155971, -0.005418058049694565, -0.01704074765969942, -0.004005087612547704, 0.038182145751556096, -0.014908178333588918, -0.05348083538870748, -0.011478881673672798, 0.04684576150038373, -0.01304681480143659, 
-0.087434451061994, -0.03697393589861306, 0.02613480907680695, -0.042173121038732816, 0.024623603368152308, -0.025719458738232105, -0.08265016209109276, 0.08141988391257245, 0.014030381226493858, -0.01133347072602054, -0.04762183274910702, -0.011516688450608296, 0.02398717612987009, -0.00423452154955256, 0.052817064446339046, -0.03821599938366749, 0.124718267222333, -0.0676686655492348, 0.01194624681035507, 0.0333247529328292, -0.001856382280744399, 0.03902305632288947, 0.03244150700816414, -0.02941910526530158, -0.023260772337653977, -0.03404994476142062, 0.042064526716416424, -0.05801177412865786, 0.0008412819334329323, -0.04348563525475359, 0.03020238389565443, -0.006980651672292138, 0.0019289070625475796, 0.025818642198349433, 0.024943497782726854, -0.010528323371897444, -0.032857557452893156, -0.013498754170362278, 0.025190134194325708, -0.1024716241931098, 0.010572382302935994, 0.04016325552999054, 0.036892586584929124, 0.03084137209097568, -0.023361818567545385, 0.025081780967674272, 0.04540292461409547, 0.05655898789365041, -0.06269454857578988, 0.02825044425939064, 0.002164504983953926, -0.04792383668194413, -0.041425859354138, -0.023457786215727274, -0.034201058531641126, 0.038301477323597254, 0.01853677610155976, -0.030284519018715393, -0.02521022760116785, -0.012202922412009242, -0.0401679284876879, 0.03520799121547839, 0.025285083439298237, 0.03405324764814303, 0.016365472437109944, 0.11669264159080693, -0.04265310010322394, -0.026058571964274472, -0.00494820630235296, 0.042792685950611656, 0.007955291547308273, 0.01942244145316131, -0.01088594362602239, -0.05272811430241602, 0.014095163357024718, -0.010425604948645403, 0.04950930408742463, 0.02394768701022145, -0.038878486587611144, -0.04530539865212758, -0.036841104741696294, -0.04925691475785557, -0.004195812692488633, -0.07773618688266186, -0.0569295228738075, -0.0156970268423457, -0.029466359894698816, 0.026819786932772052, 0.056276063275525846, -0.010232270234273214, 0.0026493380012488944, 
0.0665985867690834, 0.06401626687379264, 0.051104418475432525, 0.12197520690138268, 0.08889794359642077, -0.08211030147579985, 0.016586168549372532, 0.02330681859631574, 0.006325403820515276, 0.05535047042737634, -0.016151254579320547, 0.019258476155385385, -0.041831650800378505, -0.04249693899629052, -0.09462400155433459, 0.007087499242012045, 0.037851183590295226, -0.10373477505238365, -0.013531045070014932, 0.004433224073631766, 0.04983967375502956, -0.041768438609337336, 0.020743682747245147, -0.04849574513656991, 0.005370875181550877, 0.039129985005495214, 0.04453255285223812, 0.03153645403942409, -0.005181080640447939, 0.0023185170648252168, 0.01103185568871606, 0.0448677207928877, 0.013504169889655629, 0.01847994833284798, -0.058063347799141664, 0.009633727947010963, -0.07452252714010874, -0.14942605594501174, 0.03187326091382923, 0.03872134444000385, -0.010277249778722913, 0.09412303294625941, -0.03437307395732618, 0.028453810630109246, 0.03971682387980322, 0.03430247724943297, 0.013806632965753194, -0.06097892361586717, -0.0029031125991954136, -0.08731224253021283, -0.04846455568647359, 0.03765628511955046, 0.05920287394927544, 0.024016111215058256, 0.05254483944431815, 0.05413616339171791, -0.04092546554201258, 0.03862703410620845, 0.05063483435067101, 0.021246834657943813, 0.0018515304649492754, -0.06823756740129144, 0.0180866791956354, -0.006590395200575624, -0.08568287789632058, -0.03445969747135928, 0.06628008147019668, 0.04803511920871051, 0.027871906501851104, 0.019511912999722575, -0.04969296231541683, -0.05263747165337913, -0.00950931821820102, -0.07190332044467712, -0.012531711107957725, -0.025664625843945094, -0.04222735489379554, -0.03490706437939097, 0.03650554845878759, 0.10896406069679847, -0.021618196147767724, -0.04917367144282124, 0.024816162612265855, 0.04057752099890331, 0.05082889947651515, -0.07300436398414044, 0.04507343676974526, 0.03717095681787058, 0.02271073879286816, -0.03529061547841931, 0.03317209971859105, 
0.004328033283457016, -0.11989723164457486, 0.014792032051095548, 0.0261975894395867, -0.0330815833329639, 0.016255976390493438, -0.034998614579422535, 0.09818874989563707, -0.023131012846350156, -0.12461348871670976, 0.07405867471830435, 0.055730325993851006, 0.003581917419810251, -0.09241802048147521, 0.029454340188224223, 0.044370740289015075, 0.01155164385751444, -0.048599179336373984, 0.012202320709339519, -0.0660278752705277, -0.1277297323369713, -0.017874115964992724, 0.02419640807223857, -0.03200136764213143, 0.018561416219028043, 0.0056293328390657656, 0.004460114841901731, -0.015364810956508917, 0.01279728665881898, 0.021512860664101702, -0.04107225527288333, 0.10442851363263866, 0.033528128282210114, 0.0006106414961582441, -0.02666022452377072, 0.00875782069055116, 0.016834132189843233, -0.10171490297250518, 0.012956564402076714, 0.10143625062806833, 0.08115023819945406, -0.021987182138398315, 0.033801713642078915, -0.04470992941618245, 0.05215929164140572, 0.059281270730203665, -0.014089539313117778, -0.01239082126945114, -0.07335806247112202, -0.04929355495887777, 0.027068355193381535, 0.03610086587466898, -0.026635468622228098, 0.016366692883415437, 0.07533769997273267, 0.01914888384279272, -0.02721596822394937, 0.055897797984396674, 0.010356777909764789, -0.031094556135147965, 0.008462621676723112, -0.08168864379639437, 0.09344266000030814, 0.014642725701238746, 0.09214364492421967, -0.027686795452445817, -0.0024461398935194654, -0.05133717141665113, -0.04119388263426063, 0.023278634438788512, -0.025404802301740314, 0.04140856381331396, -0.026798773197195255, 0.05271491507294931, -0.054915736798264295, -0.03484141831545626, 0.08757676178390991, -0.009377601529839102, -0.0643381021289301, -0.003146219982147912, -0.025092895936678836, -0.110463510652361, -0.037234692432350246, -0.06456658587657613, -0.034536486076310956, 0.021568775657525754, -0.05266777959406189, -0.06700459677182359, 0.049132938935779885, 0.10166902013945689, 0.0234704519867792, 
-0.021739729032263462, 0.05939837106558099, 0.01030190058270259, -0.1197644455671501, -0.0202230740820015, -0.012221442785810449, -0.009744365610101809, -0.04443094511431738, 0.02192958948578768, 0.013113936884632842, 0.032453619758804925, 0.04404958643982874, -0.002598341029023738, 0.041334165206522396, 0.09532856161336392, 0.033509269577697696, 0.032183891484357574, -0.018013944840055217, 0.03737056222654082, 0.0728399040071079, 0.025966423803521526, -0.032967171466459444, 0.05485292829524351, -0.06827138662457094, 0.052785797409337414, 0.021388545801028776, -0.005990868923259698, -0.02917700334746743, -0.056120687921654394, 0.025067952620438382, -0.02994739064789101, 0.05219976549480272, 0.02563019236740891, 0.0777714999326549, -0.04911590740403607, -0.03346014995099733, 0.00829732098802963, -0.054424146078947674, 0.03977863615046308, -0.011403972966097017, -0.006482755920731003, 0.004296953262530169, -0.0021098609201806863, -0.01685665363282054, -0.011941082451465685, -0.006832353948144935, 0.04063570953475983, -0.004694481485354449, 0.0012306652689024326, 0.04838281355156215, 0.027279924012407933, 0.018895061778044044, -0.05392290996183548, -0.05268863232308877, -0.030475214951947386, 0.030561040026587213, 0.07256421253333299, 0.07263311462872374, -0.0027727991230348708, -0.005465216620731639, 0.006468790761681956, 0.107194626325958, -0.022543228277055256]], "intercept": [0.04574089582279315, -0.015594972179931981, -0.030145923642861346], "label_map": {"Summary": 0, "Needle": 1, "Reasoning": 2}}
special_tokens_map.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "cls_token": {
10
+ "content": "<s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "eos_token": {
17
+ "content": "</s>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "mask_token": {
24
+ "content": "<mask>",
25
+ "lstrip": true,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "pad_token": {
31
+ "content": "<pad>",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ },
37
+ "sep_token": {
38
+ "content": "</s>",
39
+ "lstrip": false,
40
+ "normalized": false,
41
+ "rstrip": false,
42
+ "single_word": false
43
+ },
44
+ "unk_token": {
45
+ "content": "<unk>",
46
+ "lstrip": false,
47
+ "normalized": false,
48
+ "rstrip": false,
49
+ "single_word": false
50
+ }
51
+ }
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a56def25aa40facc030ea8b0b87f3688e4b3c39eb8b45d5702b3a1300fe2a20
3
+ size 17082734
tokenizer_config.json ADDED
@@ -0,0 +1,65 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "<s>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "1": {
12
+ "content": "<pad>",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "2": {
20
+ "content": "</s>",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "3": {
28
+ "content": "<unk>",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "250001": {
36
+ "content": "<mask>",
37
+ "lstrip": true,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "bos_token": "<s>",
45
+ "clean_up_tokenization_spaces": false,
46
+ "cls_token": "<s>",
47
+ "do_lower_case": true,
48
+ "eos_token": "</s>",
49
+ "extra_special_tokens": {},
50
+ "mask_token": "<mask>",
51
+ "max_length": 128,
52
+ "model_max_length": 128,
53
+ "pad_to_multiple_of": null,
54
+ "pad_token": "<pad>",
55
+ "pad_token_type_id": 0,
56
+ "padding_side": "right",
57
+ "sep_token": "</s>",
58
+ "stride": 0,
59
+ "strip_accents": null,
60
+ "tokenize_chinese_chars": true,
61
+ "tokenizer_class": "PreTrainedTokenizerFast",
62
+ "truncation_side": "right",
63
+ "truncation_strategy": "longest_first",
64
+ "unk_token": "<unk>"
65
+ }