Adding ONNX file of this model

#48

by abukhoyer - opened Dec 17, 2025

base: refs/heads/main

←

from: refs/pr/48

Discussion Files changed

+151824

-319

Files changed (11) hide show

.gitattributes +1 -0
README.md +316 -315
onnx/added_tokens.json +5 -0
onnx/config.json +35 -0
onnx/merges.txt +0 -0
onnx/model.onnx +2 -2
onnx/model.onnx_data +2 -2
onnx/special_tokens_map.json +20 -0
onnx/tokenizer.json +3 -0
onnx/tokenizer_config.json +51 -0
onnx/vocab.json +0 -0

.gitattributes CHANGED Viewed

@@ -35,3 +35,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
 onnx/model.onnx_data filter=lfs diff=lfs merge=lfs -text
 onnx/model_fp16.onnx_data filter=lfs diff=lfs merge=lfs -text

 *tfevents* filter=lfs diff=lfs merge=lfs -text
 onnx/model.onnx_data filter=lfs diff=lfs merge=lfs -text
 onnx/model_fp16.onnx_data filter=lfs diff=lfs merge=lfs -text
+onnx/tokenizer.json filter=lfs diff=lfs merge=lfs -text

README.md CHANGED Viewed

@@ -1,13 +1,22 @@
 ---
 model-index:
 - name: stella_en_1.5B_v5
   results:
-  - dataset:
-      config: en
       name: MTEB AmazonCounterfactualClassification (en)
-      revision: e8379541af4e31359cca9fbcf4b00f2671dba205
-      split: test
       type: mteb/amazon_counterfactual
     metrics:
     - type: accuracy
       value: 92.86567164179104
@@ -21,14 +30,14 @@ model-index:
       value: 93.13621183004571
     - type: main_score
       value: 92.86567164179104
-    task:
       type: Classification
-  - dataset:
-      config: default
       name: MTEB AmazonPolarityClassification
-      revision: e2d317d38cd51312af73b3d32a06d1a08b442046
-      split: test
       type: mteb/amazon_polarity
     metrics:
     - type: accuracy
       value: 97.16485
@@ -42,14 +51,14 @@ model-index:
       value: 97.16351087403213
     - type: main_score
       value: 97.16485
-    task:
       type: Classification
-  - dataset:
-      config: en
       name: MTEB AmazonReviewsClassification (en)
-      revision: 1399c76144fd37290681b995c656ef9b2e06e26d
-      split: test
       type: mteb/amazon_reviews_multi
     metrics:
     - type: accuracy
       value: 59.358
@@ -59,14 +68,14 @@ model-index:
       value: 59.0264615883114
     - type: main_score
       value: 59.358
-    task:
-      type: Classification
-  - dataset:
-      config: default
       name: MTEB ArguAna
-      revision: c22ab2a51041ffd869aaddef7af8d8215647e41a
-      split: test
       type: mteb/arguana
     metrics:
     - type: main_score
       value: 65.269
@@ -350,14 +359,14 @@ model-index:
       value: 67.354
     - type: recall_at_5
       value: 78.236
-    task:
-      type: Retrieval
-  - dataset:
-      config: default
       name: MTEB ArxivClusteringP2P
-      revision: a122ad7f3f0291bf49cc6f4d32aa80929df69d5d
-      split: test
       type: mteb/arxiv-clustering-p2p
     metrics:
     - type: main_score
       value: 55.437138353189994
@@ -365,14 +374,14 @@ model-index:
       value: 55.437138353189994
     - type: v_measure_std
       value: 14.718556601335491
-    task:
       type: Clustering
-  - dataset:
-      config: default
       name: MTEB ArxivClusteringS2S
-      revision: f910caf1a6075f7329cdf8c1a6135696f37dbd53
-      split: test
       type: mteb/arxiv-clustering-s2s
     metrics:
     - type: main_score
       value: 50.65858459544658
@@ -380,14 +389,14 @@ model-index:
       value: 50.65858459544658
     - type: v_measure_std
       value: 14.887033747525146
-    task:
-      type: Clustering
-  - dataset:
-      config: default
       name: MTEB AskUbuntuDupQuestions
-      revision: 2000358ca161889fa9c082cb41daa8dcfb161a54
-      split: test
       type: mteb/askubuntudupquestions-reranking
     metrics:
     - type: main_score
       value: 67.32597152838535
@@ -407,14 +416,14 @@ model-index:
       value: 41.64561939958336
     - type: nAUC_mrr_std
       value: 23.179909345891968
-    task:
-      type: Reranking
-  - dataset:
-      config: default
       name: MTEB BIOSSES
-      revision: d3fb88f8f02e40887cd149695127462bbcf29b4a
-      split: test
       type: mteb/biosses-sts
     metrics:
     - type: cosine_pearson
       value: 85.790820496042
@@ -434,14 +443,14 @@ model-index:
       value: 85.790820496042
     - type: spearman
       value: 83.10731534330517
-    task:
-      type: STS
-  - dataset:
-      config: default
       name: MTEB Banking77Classification
-      revision: 0fd18e25b25c072e09e0d92ab615fda904d66300
-      split: test
       type: mteb/banking77
     metrics:
     - type: accuracy
       value: 89.78896103896105
@@ -451,14 +460,14 @@ model-index:
       value: 89.76107366333488
     - type: main_score
       value: 89.78896103896105
-    task:
-      type: Classification
-  - dataset:
-      config: default
       name: MTEB BiorxivClusteringP2P
-      revision: 65b79d1d13f80053f67aca9498d9402c2d9f1f40
-      split: test
       type: mteb/biorxiv-clustering-p2p
     metrics:
     - type: main_score
       value: 50.68092296236376
@@ -466,14 +475,14 @@ model-index:
       value: 50.68092296236376
     - type: v_measure_std
       value: 0.7832640983085436
-    task:
       type: Clustering
-  - dataset:
-      config: default
       name: MTEB BiorxivClusteringS2S
-      revision: 258694dd0231531bc1fd9de6ceb52a0853c6d908
-      split: test
       type: mteb/biorxiv-clustering-s2s
     metrics:
     - type: main_score
       value: 46.86629236732983
@@ -481,14 +490,14 @@ model-index:
       value: 46.86629236732983
     - type: v_measure_std
       value: 0.8784322236350974
-    task:
-      type: Clustering
-  - dataset:
-      config: default
       name: MTEB CQADupstackRetrieval
-      revision: 4ffe81d471b1924886b33c7567bfb200e9eec5c4
-      split: test
       type: mteb/cqadupstack
     metrics:
     - type: main_score
       value: 47.74883333333334
@@ -772,14 +781,14 @@ model-index:
       value: 46.01841666666666
     - type: recall_at_5
       value: 52.482416666666666
-    task:
       type: Retrieval
-  - dataset:
-      config: default
       name: MTEB ClimateFEVER
-      revision: 47f2ac6acb640fc46020b02a5b59fdda04d39380
-      split: test
       type: mteb/climate-fever
     metrics:
     - type: main_score
       value: 46.113
@@ -1063,14 +1072,14 @@ model-index:
       value: 35.150999999999996
     - type: recall_at_5
       value: 42.748000000000005
-    task:
       type: Retrieval
-  - dataset:
-      config: default
       name: MTEB DBPedia
-      revision: c0f706b76e590d620bd6618b3ca8efdd34e2d659
-      split: test
       type: mteb/dbpedia
     metrics:
     - type: main_score
       value: 52.276999999999994
@@ -1354,14 +1363,14 @@ model-index:
       value: 17.876
     - type: recall_at_5
       value: 22.536
-    task:
-      type: Retrieval
-  - dataset:
-      config: default
       name: MTEB EmotionClassification
-      revision: 4f58c6b202a23cf9a4da393831edf4f9183cad37
-      split: test
       type: mteb/emotion
     metrics:
     - type: accuracy
       value: 84.29499999999999
@@ -1371,14 +1380,14 @@ model-index:
       value: 84.96026012933847
     - type: main_score
       value: 84.29499999999999
-    task:
-      type: Classification
-  - dataset:
-      config: default
       name: MTEB FEVER
-      revision: bea83ef9e8fb933d90a2f1d5515737465d613e12
-      split: test
       type: mteb/fever
     metrics:
     - type: main_score
       value: 94.83200000000001
@@ -1662,14 +1671,14 @@ model-index:
       value: 95.069
     - type: recall_at_5
       value: 96.177
-    task:
       type: Retrieval
-  - dataset:
-      config: default
       name: MTEB FiQA2018
-      revision: 27a168819829fe9bcd655c2df245fb19452e8e06
-      split: test
       type: mteb/fiqa
     metrics:
     - type: main_score
       value: 60.480000000000004
@@ -1953,14 +1962,14 @@ model-index:
       value: 50.221000000000004
     - type: recall_at_5
       value: 58.209999999999994
-    task:
       type: Retrieval
-  - dataset:
-      config: default
       name: MTEB HotpotQA
-      revision: ab518f4d6fcca38d87c25209f94beba119d02014
-      split: test
       type: mteb/hotpotqa
     metrics:
     - type: main_score
       value: 76.67399999999999
@@ -2244,14 +2253,14 @@ model-index:
       value: 68.879
     - type: recall_at_5
       value: 73.896
-    task:
-      type: Retrieval
-  - dataset:
-      config: default
       name: MTEB ImdbClassification
-      revision: 3d86128a09e091d6018b6d26cad27f2739fc2db7
-      split: test
       type: mteb/imdb
     metrics:
     - type: accuracy
       value: 96.6608
@@ -2265,14 +2274,14 @@ model-index:
       value: 96.66029695623423
     - type: main_score
       value: 96.6608
-    task:
-      type: Classification
-  - dataset:
-      config: default
       name: MTEB MSMARCO
-      revision: c5a29a104738b98a9e76336939199e264163d4a0
-      split: dev
       type: mteb/msmarco
     metrics:
     - type: main_score
       value: 45.217
@@ -2556,14 +2565,14 @@ model-index:
       value: 45.535
     - type: recall_at_5
       value: 55.394
-    task:
-      type: Retrieval
-  - dataset:
-      config: en
       name: MTEB MTOPDomainClassification (en)
-      revision: d80d48c1eb48d3562165c59d59d0034df9fff0bf
-      split: test
       type: mteb/mtop_domain
     metrics:
     - type: accuracy
       value: 99.01276789785682
@@ -2573,14 +2582,14 @@ model-index:
       value: 99.01406884928141
     - type: main_score
       value: 99.01276789785682
-    task:
       type: Classification
-  - dataset:
-      config: en
       name: MTEB MTOPIntentClassification (en)
-      revision: ae001d0e6b1228650b7bd1c2c65fb50ad11a8aba
-      split: test
       type: mteb/mtop_intent
     metrics:
     - type: accuracy
       value: 92.78385772913816
@@ -2590,14 +2599,14 @@ model-index:
       value: 93.90424147486428
     - type: main_score
       value: 92.78385772913816
-    task:
       type: Classification
-  - dataset:
-      config: en
       name: MTEB MassiveIntentClassification (en)
-      revision: 4672e20407010da34463acc759c162ca9734bca6
-      split: test
       type: mteb/amazon_massive_intent
     metrics:
     - type: accuracy
       value: 85.83053127101546
@@ -2607,14 +2616,14 @@ model-index:
       value: 85.81759723866098
     - type: main_score
       value: 85.83053127101546
-    task:
       type: Classification
-  - dataset:
-      config: en
       name: MTEB MassiveScenarioClassification (en)
-      revision: fad2c6e8459f9e1c45d9315f4953d921437d70f8
-      split: test
       type: mteb/amazon_massive_scenario
     metrics:
     - type: accuracy
       value: 90.19838601210489
@@ -2624,14 +2633,14 @@ model-index:
       value: 90.11422965504119
     - type: main_score
       value: 90.19838601210489
-    task:
-      type: Classification
-  - dataset:
-      config: default
       name: MTEB MedrxivClusteringP2P
-      revision: e7a26af6f3ae46b30dde8737f02c07b1505bcc73
-      split: test
       type: mteb/medrxiv-clustering-p2p
     metrics:
     - type: main_score
       value: 46.866746897607094
@@ -2639,14 +2648,14 @@ model-index:
       value: 46.866746897607094
     - type: v_measure_std
       value: 1.0966477896919726
-    task:
       type: Clustering
-  - dataset:
-      config: default
       name: MTEB MedrxivClusteringS2S
-      revision: 35191c8c0dca72d8ff3efcd72aa802307d469663
-      split: test
       type: mteb/medrxiv-clustering-s2s
     metrics:
     - type: main_score
       value: 44.6538827415503
@@ -2654,14 +2663,14 @@ model-index:
       value: 44.6538827415503
     - type: v_measure_std
       value: 1.1649569936599116
-    task:
-      type: Clustering
-  - dataset:
-      config: default
       name: MTEB MindSmallReranking
-      revision: 59042f120c80e8afa9cdbb224f67076cec0fc9a7
-      split: test
       type: mteb/mind_small
     metrics:
     - type: main_score
       value: 33.05449204940555
@@ -2681,14 +2690,14 @@ model-index:
       value: -15.304687384645769
     - type: nAUC_mrr_std
       value: -0.519919931348978
-    task:
-      type: Reranking
-  - dataset:
-      config: default
       name: MTEB NFCorpus
-      revision: ec0fa4fe99da2ff19ca1214b7966684033a58814
-      split: test
       type: mteb/nfcorpus
     metrics:
     - type: main_score
       value: 41.998000000000005
@@ -2972,14 +2981,14 @@ model-index:
       value: 13.267999999999999
     - type: recall_at_5
       value: 16.141
-    task:
       type: Retrieval
-  - dataset:
-      config: default
       name: MTEB NQ
-      revision: b774495ed302d8c44a3a7ea25c90dbce03968f31
-      split: test
       type: mteb/nq
     metrics:
     - type: main_score
       value: 71.8
@@ -3263,14 +3272,14 @@ model-index:
       value: 74.394
     - type: recall_at_5
       value: 82.711
-    task:
       type: Retrieval
-  - dataset:
-      config: default
       name: MTEB QuoraRetrieval
-      revision: e4e08e0b7dbe3c8700f0daef558ff32256715259
-      split: test
       type: mteb/quora
     metrics:
     - type: main_score
       value: 90.025
@@ -3554,14 +3563,14 @@ model-index:
       value: 89.276
     - type: recall_at_5
       value: 93.46
-    task:
-      type: Retrieval
-  - dataset:
-      config: default
       name: MTEB RedditClustering
-      revision: 24640382cdbf8abc73003fb0fa6d111a705499eb
-      split: test
       type: mteb/reddit-clustering
     metrics:
     - type: main_score
       value: 72.86492101891123
@@ -3569,14 +3578,14 @@ model-index:
       value: 72.86492101891123
     - type: v_measure_std
       value: 2.778711445144635
-    task:
       type: Clustering
-  - dataset:
-      config: default
       name: MTEB RedditClusteringP2P
-      revision: 385e3cb46b4cfa89021f56c4380204149d0efe33
-      split: test
       type: mteb/reddit-clustering-p2p
     metrics:
     - type: main_score
       value: 75.27316726548479
@@ -3584,14 +3593,14 @@ model-index:
       value: 75.27316726548479
     - type: v_measure_std
       value: 8.87871936725338
-    task:
-      type: Clustering
-  - dataset:
-      config: default
       name: MTEB SCIDOCS
-      revision: f8c2fcf00f625baaa80f62ec5bd9e1fff3b8ae88
-      split: test
       type: mteb/scidocs
     metrics:
     - type: main_score
       value: 26.638
@@ -3875,14 +3884,14 @@ model-index:
       value: 14.127999999999998
     - type: recall_at_5
       value: 19.673
-    task:
-      type: Retrieval
-  - dataset:
-      config: default
       name: MTEB SICK-R
-      revision: 20a6d6f312dd54037fe07a32d58e5e168867909d
-      split: test
       type: mteb/sickr-sts
     metrics:
     - type: cosine_pearson
       value: 86.86608529160739
@@ -3902,14 +3911,14 @@ model-index:
       value: 86.86608529160739
     - type: spearman
       value: 82.88625166203383
-    task:
       type: STS
-  - dataset:
-      config: default
       name: MTEB STS12
-      revision: a0d554a64d88156834ff5ae9920b964011b16384
-      split: test
       type: mteb/sts12-sts
     metrics:
     - type: cosine_pearson
       value: 87.0445014940449
@@ -3929,14 +3938,14 @@ model-index:
       value: 87.0445014940449
     - type: spearman
       value: 80.0880365116599
-    task:
       type: STS
-  - dataset:
-      config: default
       name: MTEB STS13
-      revision: 7e90230a92c190f1bf69ae9002b8cea547a64cca
-      split: test
       type: mteb/sts13-sts
     metrics:
     - type: cosine_pearson
       value: 89.33900828959968
@@ -3956,14 +3965,14 @@ model-index:
       value: 89.33900828959968
     - type: spearman
       value: 89.68256358526733
-    task:
       type: STS
-  - dataset:
-      config: default
       name: MTEB STS14
-      revision: 6031580fec1f6af667f0bd2da0a551cf4f0b2375
-      split: test
       type: mteb/sts14-sts
     metrics:
     - type: cosine_pearson
       value: 86.42029843639123
@@ -3983,14 +3992,14 @@ model-index:
       value: 86.42029843639123
     - type: spearman
       value: 85.0707889220723
-    task:
       type: STS
-  - dataset:
-      config: default
       name: MTEB STS15
-      revision: ae752c7c21bf194d8b67fd573edf7ae58183cbe3
-      split: test
       type: mteb/sts15-sts
     metrics:
     - type: cosine_pearson
       value: 88.3660081271444
@@ -4010,14 +4019,14 @@ model-index:
       value: 88.3660081271444
     - type: spearman
       value: 89.39375083609528
-    task:
       type: STS
-  - dataset:
-      config: default
       name: MTEB STS16
-      revision: 4d8694f8f0e0100860b497b999b3dbed754a0513
-      split: test
       type: mteb/sts16-sts
     metrics:
     - type: cosine_pearson
       value: 85.60708247171874
@@ -4037,14 +4046,14 @@ model-index:
       value: 85.60708247171874
     - type: spearman
       value: 87.15234952832193
-    task:
       type: STS
-  - dataset:
-      config: en-en
       name: MTEB STS17 (en-en)
-      revision: faeb762787bd10488a50c8b5be4a3b82e411949c
-      split: test
       type: mteb/sts17-crosslingual-sts
     metrics:
     - type: cosine_pearson
       value: 91.25898556808458
@@ -4064,14 +4073,14 @@ model-index:
       value: 91.25898556808458
     - type: spearman
       value: 91.35372390581641
-    task:
       type: STS
-  - dataset:
-      config: en
       name: MTEB STS22 (en)
-      revision: de9d86b3b84231dc21f76c7b7af1f28e2f57f6e3
-      split: test
       type: mteb/sts22-crosslingual-sts
     metrics:
     - type: cosine_pearson
       value: 67.61637111515797
@@ -4091,14 +4100,14 @@ model-index:
       value: 67.61637111515797
     - type: spearman
       value: 68.10379096526697
-    task:
       type: STS
-  - dataset:
-      config: default
       name: MTEB STSBenchmark
-      revision: b0fddb56ed78048fa8b90373c8a3cfc37b684831
-      split: test
       type: mteb/stsbenchmark-sts
     metrics:
     - type: cosine_pearson
       value: 87.81592853782297
@@ -4118,14 +4127,14 @@ model-index:
       value: 87.81592853782297
     - type: spearman
       value: 88.2302550329183
-    task:
-      type: STS
-  - dataset:
-      config: default
       name: MTEB SciDocsRR
-      revision: d3c5e1fc0b855ab6097bf1cda04dd73947d7caab
-      split: test
       type: mteb/scidocs-reranking
     metrics:
     - type: main_score
       value: 89.196009707431
@@ -4145,14 +4154,14 @@ model-index:
       value: 86.38341077184032
     - type: nAUC_mrr_std
       value: 75.38945014727746
-    task:
-      type: Reranking
-  - dataset:
-      config: default
       name: MTEB SciFact
-      revision: 0228b52cf27578f30900b9e5271d331663a030d7
-      split: test
       type: mteb/scifact
     metrics:
     - type: main_score
       value: 80.08999999999999
@@ -4436,14 +4445,14 @@ model-index:
       value: 80.972
     - type: recall_at_5
       value: 89.90599999999999
-    task:
-      type: Retrieval
-  - dataset:
-      config: default
       name: MTEB SprintDuplicateQuestions
-      revision: d66bd1f72af766a5cc4b0ca5e00c162f89e8cc46
-      split: test
       type: mteb/sprintduplicatequestions-pairclassification
     metrics:
     - type: cosine_accuracy
       value: 99.81881188118813
@@ -4525,14 +4534,14 @@ model-index:
       value: 92.59645464025026
     - type: similarity_recall
       value: 88.8
-    task:
-      type: PairClassification
-  - dataset:
-      config: default
       name: MTEB StackExchangeClustering
-      revision: 6cbc1f7b2bc0622f2e39d2c77fa502909748c259
-      split: test
       type: mteb/stackexchange-clustering
     metrics:
     - type: main_score
       value: 80.28558559137414
@@ -4540,14 +4549,14 @@ model-index:
       value: 80.28558559137414
     - type: v_measure_std
       value: 2.795276520287584
-    task:
       type: Clustering
-  - dataset:
-      config: default
       name: MTEB StackExchangeClusteringP2P
-      revision: 815ca46b2622cec33ccafc3735d572c266efdb44
-      split: test
       type: mteb/stackexchange-clustering-p2p
     metrics:
     - type: main_score
       value: 49.57135582416209
@@ -4555,14 +4564,14 @@ model-index:
       value: 49.57135582416209
     - type: v_measure_std
       value: 1.6414135468423754
-    task:
-      type: Clustering
-  - dataset:
-      config: default
       name: MTEB StackOverflowDupQuestions
-      revision: e185fbe320c72810689fc5848eb6114e1ef5ec69
-      split: test
       type: mteb/stackoverflowdupquestions-reranking
     metrics:
     - type: main_score
       value: 55.253002583598644
@@ -4582,14 +4591,14 @@ model-index:
       value: 10.586310195339053
     - type: nAUC_mrr_std
       value: 8.47326494370076
-    task:
-      type: Reranking
-  - dataset:
-      config: default
       name: MTEB SummEval
-      revision: cda12ad7615edc362dbf25a00fdd61d3b1eaf93c
-      split: test
       type: mteb/summeval
     metrics:
     - type: cosine_pearson
       value: 31.19874648747059
@@ -4605,14 +4614,14 @@ model-index:
       value: 31.19874648747059
     - type: spearman
       value: 31.493550648844863
-    task:
-      type: Summarization
-  - dataset:
-      config: default
       name: MTEB TRECCOVID
-      revision: bb9466bac8153a0349341eb1b22e06409e78ef4e
-      split: test
       type: mteb/trec-covid
     metrics:
     - type: main_score
       value: 85.983
@@ -4896,14 +4905,14 @@ model-index:
       value: 0.7250000000000001
     - type: recall_at_5
       value: 1.1820000000000002
-    task:
       type: Retrieval
-  - dataset:
-      config: default
       name: MTEB Touche2020
-      revision: a34f9a33db75fa0cbb21bb5cfc3dae8dc8bec93f
-      split: test
       type: mteb/touche2020
     metrics:
     - type: main_score
       value: 29.944
@@ -5187,14 +5196,14 @@ model-index:
       value: 7.383000000000001
     - type: recall_at_5
       value: 11.434
-    task:
-      type: Retrieval
-  - dataset:
-      config: default
       name: MTEB ToxicConversationsClassification
-      revision: edfaf9da55d3dd50d43143d90c1ac476895ae6de
-      split: test
       type: mteb/toxic_conversations_50k
     metrics:
     - type: accuracy
       value: 88.759765625
@@ -5208,14 +5217,14 @@ model-index:
       value: 90.54372649306606
     - type: main_score
       value: 88.759765625
-    task:
       type: Classification
-  - dataset:
-      config: default
       name: MTEB TweetSentimentExtractionClassification
-      revision: d604517c81ca91fe16a244d1248fc021f9ecee7a
-      split: test
       type: mteb/tweet_sentiment_extraction
     metrics:
     - type: accuracy
       value: 74.8443689869836
@@ -5225,14 +5234,14 @@ model-index:
       value: 74.7369003946243
     - type: main_score
       value: 74.8443689869836
-    task:
-      type: Classification
-  - dataset:
-      config: default
       name: MTEB TwentyNewsgroupsClustering
-      revision: 6125ec4e24fa026cec8a478383ee943acfbd5449
-      split: test
       type: mteb/twentynewsgroups-clustering
     metrics:
     - type: main_score
       value: 61.42918790942448
@@ -5240,14 +5249,14 @@ model-index:
       value: 61.42918790942448
     - type: v_measure_std
       value: 1.0156550098843082
-    task:
-      type: Clustering
-  - dataset:
-      config: default
       name: MTEB TwitterSemEval2015
-      revision: 70970daeab8776df92f5ea462b6173c0b46fd2d1
-      split: test
       type: mteb/twittersemeval2015-pairclassification
     metrics:
     - type: cosine_accuracy
       value: 88.22197055492639
@@ -5329,14 +5338,14 @@ model-index:
       value: 71.64922770303936
     - type: similarity_recall
       value: 75.8839050131926
-    task:
       type: PairClassification
-  - dataset:
-      config: default
       name: MTEB TwitterURLCorpus
-      revision: 8b6510b0b1fa4e4c4f879467980e9be563ec1cdf
-      split: test
       type: mteb/twitterurlcorpus-pairclassification
     metrics:
     - type: cosine_accuracy
       value: 89.88628866379477
@@ -5418,14 +5427,6 @@ model-index:
       value: 76.93126197063205
     - type: similarity_recall
       value: 83.50015398829689
-    task:
-      type: PairClassification
-tags:
-- mteb
-- sentence-transformers
-- transformers
-- sentence-similarity
-license: mit
 ---

 ---
+tags:
+- mteb
+- sentence-transformers
+- transformers
+- sentence-similarity
+- onnx
+license: mit
 model-index:
 - name: stella_en_1.5B_v5
   results:
+  - task:
+      type: Classification
+    dataset:
       name: MTEB AmazonCounterfactualClassification (en)
       type: mteb/amazon_counterfactual
+      config: en
+      split: test
+      revision: e8379541af4e31359cca9fbcf4b00f2671dba205
     metrics:
     - type: accuracy
       value: 92.86567164179104
       value: 93.13621183004571
     - type: main_score
       value: 92.86567164179104
+  - task:
       type: Classification
+    dataset:
       name: MTEB AmazonPolarityClassification
       type: mteb/amazon_polarity
+      config: default
+      split: test
+      revision: e2d317d38cd51312af73b3d32a06d1a08b442046
     metrics:
     - type: accuracy
       value: 97.16485
       value: 97.16351087403213
     - type: main_score
       value: 97.16485
+  - task:
       type: Classification
+    dataset:
       name: MTEB AmazonReviewsClassification (en)
       type: mteb/amazon_reviews_multi
+      config: en
+      split: test
+      revision: 1399c76144fd37290681b995c656ef9b2e06e26d
     metrics:
     - type: accuracy
       value: 59.358
       value: 59.0264615883114
     - type: main_score
       value: 59.358
+  - task:
+      type: Retrieval
+    dataset:
       name: MTEB ArguAna
       type: mteb/arguana
+      config: default
+      split: test
+      revision: c22ab2a51041ffd869aaddef7af8d8215647e41a
     metrics:
     - type: main_score
       value: 65.269
       value: 67.354
     - type: recall_at_5
       value: 78.236
+  - task:
+      type: Clustering
+    dataset:
       name: MTEB ArxivClusteringP2P
       type: mteb/arxiv-clustering-p2p
+      config: default
+      split: test
+      revision: a122ad7f3f0291bf49cc6f4d32aa80929df69d5d
     metrics:
     - type: main_score
       value: 55.437138353189994
       value: 55.437138353189994
     - type: v_measure_std
       value: 14.718556601335491
+  - task:
       type: Clustering
+    dataset:
       name: MTEB ArxivClusteringS2S
       type: mteb/arxiv-clustering-s2s
+      config: default
+      split: test
+      revision: f910caf1a6075f7329cdf8c1a6135696f37dbd53
     metrics:
     - type: main_score
       value: 50.65858459544658
       value: 50.65858459544658
     - type: v_measure_std
       value: 14.887033747525146
+  - task:
+      type: Reranking
+    dataset:
       name: MTEB AskUbuntuDupQuestions
       type: mteb/askubuntudupquestions-reranking
+      config: default
+      split: test
+      revision: 2000358ca161889fa9c082cb41daa8dcfb161a54
     metrics:
     - type: main_score
       value: 67.32597152838535
       value: 41.64561939958336
     - type: nAUC_mrr_std
       value: 23.179909345891968
+  - task:
+      type: STS
+    dataset:
       name: MTEB BIOSSES
       type: mteb/biosses-sts
+      config: default
+      split: test
+      revision: d3fb88f8f02e40887cd149695127462bbcf29b4a
     metrics:
     - type: cosine_pearson
       value: 85.790820496042
       value: 85.790820496042
     - type: spearman
       value: 83.10731534330517
+  - task:
+      type: Classification
+    dataset:
       name: MTEB Banking77Classification
       type: mteb/banking77
+      config: default
+      split: test
+      revision: 0fd18e25b25c072e09e0d92ab615fda904d66300
     metrics:
     - type: accuracy
       value: 89.78896103896105
       value: 89.76107366333488
     - type: main_score
       value: 89.78896103896105
+  - task:
+      type: Clustering
+    dataset:
       name: MTEB BiorxivClusteringP2P
       type: mteb/biorxiv-clustering-p2p
+      config: default
+      split: test
+      revision: 65b79d1d13f80053f67aca9498d9402c2d9f1f40
     metrics:
     - type: main_score
       value: 50.68092296236376
       value: 50.68092296236376
     - type: v_measure_std
       value: 0.7832640983085436
+  - task:
       type: Clustering
+    dataset:
       name: MTEB BiorxivClusteringS2S
       type: mteb/biorxiv-clustering-s2s
+      config: default
+      split: test
+      revision: 258694dd0231531bc1fd9de6ceb52a0853c6d908
     metrics:
     - type: main_score
       value: 46.86629236732983
       value: 46.86629236732983
     - type: v_measure_std
       value: 0.8784322236350974
+  - task:
+      type: Retrieval
+    dataset:
       name: MTEB CQADupstackRetrieval
       type: mteb/cqadupstack
+      config: default
+      split: test
+      revision: 4ffe81d471b1924886b33c7567bfb200e9eec5c4
     metrics:
     - type: main_score
       value: 47.74883333333334
       value: 46.01841666666666
     - type: recall_at_5
       value: 52.482416666666666
+  - task:
       type: Retrieval
+    dataset:
       name: MTEB ClimateFEVER
       type: mteb/climate-fever
+      config: default
+      split: test
+      revision: 47f2ac6acb640fc46020b02a5b59fdda04d39380
     metrics:
     - type: main_score
       value: 46.113
       value: 35.150999999999996
     - type: recall_at_5
       value: 42.748000000000005
+  - task:
       type: Retrieval
+    dataset:
       name: MTEB DBPedia
       type: mteb/dbpedia
+      config: default
+      split: test
+      revision: c0f706b76e590d620bd6618b3ca8efdd34e2d659
     metrics:
     - type: main_score
       value: 52.276999999999994
       value: 17.876
     - type: recall_at_5
       value: 22.536
+  - task:
+      type: Classification
+    dataset:
       name: MTEB EmotionClassification
       type: mteb/emotion
+      config: default
+      split: test
+      revision: 4f58c6b202a23cf9a4da393831edf4f9183cad37
     metrics:
     - type: accuracy
       value: 84.29499999999999
       value: 84.96026012933847
     - type: main_score
       value: 84.29499999999999
+  - task:
+      type: Retrieval
+    dataset:
       name: MTEB FEVER
       type: mteb/fever
+      config: default
+      split: test
+      revision: bea83ef9e8fb933d90a2f1d5515737465d613e12
     metrics:
     - type: main_score
       value: 94.83200000000001
       value: 95.069
     - type: recall_at_5
       value: 96.177
+  - task:
       type: Retrieval
+    dataset:
       name: MTEB FiQA2018
       type: mteb/fiqa
+      config: default
+      split: test
+      revision: 27a168819829fe9bcd655c2df245fb19452e8e06
     metrics:
     - type: main_score
       value: 60.480000000000004
       value: 50.221000000000004
     - type: recall_at_5
       value: 58.209999999999994
+  - task:
       type: Retrieval
+    dataset:
       name: MTEB HotpotQA
       type: mteb/hotpotqa
+      config: default
+      split: test
+      revision: ab518f4d6fcca38d87c25209f94beba119d02014
     metrics:
     - type: main_score
       value: 76.67399999999999
       value: 68.879
     - type: recall_at_5
       value: 73.896
+  - task:
+      type: Classification
+    dataset:
       name: MTEB ImdbClassification
       type: mteb/imdb
+      config: default
+      split: test
+      revision: 3d86128a09e091d6018b6d26cad27f2739fc2db7
     metrics:
     - type: accuracy
       value: 96.6608
       value: 96.66029695623423
     - type: main_score
       value: 96.6608
+  - task:
+      type: Retrieval
+    dataset:
       name: MTEB MSMARCO
       type: mteb/msmarco
+      config: default
+      split: dev
+      revision: c5a29a104738b98a9e76336939199e264163d4a0
     metrics:
     - type: main_score
       value: 45.217
       value: 45.535
     - type: recall_at_5
       value: 55.394
+  - task:
+      type: Classification
+    dataset:
       name: MTEB MTOPDomainClassification (en)
       type: mteb/mtop_domain
+      config: en
+      split: test
+      revision: d80d48c1eb48d3562165c59d59d0034df9fff0bf
     metrics:
     - type: accuracy
       value: 99.01276789785682
       value: 99.01406884928141
     - type: main_score
       value: 99.01276789785682
+  - task:
       type: Classification
+    dataset:
       name: MTEB MTOPIntentClassification (en)
       type: mteb/mtop_intent
+      config: en
+      split: test
+      revision: ae001d0e6b1228650b7bd1c2c65fb50ad11a8aba
     metrics:
     - type: accuracy
       value: 92.78385772913816
       value: 93.90424147486428
     - type: main_score
       value: 92.78385772913816
+  - task:
       type: Classification
+    dataset:
       name: MTEB MassiveIntentClassification (en)
       type: mteb/amazon_massive_intent
+      config: en
+      split: test
+      revision: 4672e20407010da34463acc759c162ca9734bca6
     metrics:
     - type: accuracy
       value: 85.83053127101546
       value: 85.81759723866098
     - type: main_score
       value: 85.83053127101546
+  - task:
       type: Classification
+    dataset:
       name: MTEB MassiveScenarioClassification (en)
       type: mteb/amazon_massive_scenario
+      config: en
+      split: test
+      revision: fad2c6e8459f9e1c45d9315f4953d921437d70f8
     metrics:
     - type: accuracy
       value: 90.19838601210489
       value: 90.11422965504119
     - type: main_score
       value: 90.19838601210489
+  - task:
+      type: Clustering
+    dataset:
       name: MTEB MedrxivClusteringP2P
       type: mteb/medrxiv-clustering-p2p
+      config: default
+      split: test
+      revision: e7a26af6f3ae46b30dde8737f02c07b1505bcc73
     metrics:
     - type: main_score
       value: 46.866746897607094
       value: 46.866746897607094
     - type: v_measure_std
       value: 1.0966477896919726
+  - task:
       type: Clustering
+    dataset:
       name: MTEB MedrxivClusteringS2S
       type: mteb/medrxiv-clustering-s2s
+      config: default
+      split: test
+      revision: 35191c8c0dca72d8ff3efcd72aa802307d469663
     metrics:
     - type: main_score
       value: 44.6538827415503
       value: 44.6538827415503
     - type: v_measure_std
       value: 1.1649569936599116
+  - task:
+      type: Reranking
+    dataset:
       name: MTEB MindSmallReranking
       type: mteb/mind_small
+      config: default
+      split: test
+      revision: 59042f120c80e8afa9cdbb224f67076cec0fc9a7
     metrics:
     - type: main_score
       value: 33.05449204940555
       value: -15.304687384645769
     - type: nAUC_mrr_std
       value: -0.519919931348978
+  - task:
+      type: Retrieval
+    dataset:
       name: MTEB NFCorpus
       type: mteb/nfcorpus
+      config: default
+      split: test
+      revision: ec0fa4fe99da2ff19ca1214b7966684033a58814
     metrics:
     - type: main_score
       value: 41.998000000000005
       value: 13.267999999999999
     - type: recall_at_5
       value: 16.141
+  - task:
       type: Retrieval
+    dataset:
       name: MTEB NQ
       type: mteb/nq
+      config: default
+      split: test
+      revision: b774495ed302d8c44a3a7ea25c90dbce03968f31
     metrics:
     - type: main_score
       value: 71.8
       value: 74.394
     - type: recall_at_5
       value: 82.711
+  - task:
       type: Retrieval
+    dataset:
       name: MTEB QuoraRetrieval
       type: mteb/quora
+      config: default
+      split: test
+      revision: e4e08e0b7dbe3c8700f0daef558ff32256715259
     metrics:
     - type: main_score
       value: 90.025
       value: 89.276
     - type: recall_at_5
       value: 93.46
+  - task:
+      type: Clustering
+    dataset:
       name: MTEB RedditClustering
       type: mteb/reddit-clustering
+      config: default
+      split: test
+      revision: 24640382cdbf8abc73003fb0fa6d111a705499eb
     metrics:
     - type: main_score
       value: 72.86492101891123
       value: 72.86492101891123
     - type: v_measure_std
       value: 2.778711445144635
+  - task:
       type: Clustering
+    dataset:
       name: MTEB RedditClusteringP2P
       type: mteb/reddit-clustering-p2p
+      config: default
+      split: test
+      revision: 385e3cb46b4cfa89021f56c4380204149d0efe33
     metrics:
     - type: main_score
       value: 75.27316726548479
       value: 75.27316726548479
     - type: v_measure_std
       value: 8.87871936725338
+  - task:
+      type: Retrieval
+    dataset:
       name: MTEB SCIDOCS
       type: mteb/scidocs
+      config: default
+      split: test
+      revision: f8c2fcf00f625baaa80f62ec5bd9e1fff3b8ae88
     metrics:
     - type: main_score
       value: 26.638
       value: 14.127999999999998
     - type: recall_at_5
       value: 19.673
+  - task:
+      type: STS
+    dataset:
       name: MTEB SICK-R
       type: mteb/sickr-sts
+      config: default
+      split: test
+      revision: 20a6d6f312dd54037fe07a32d58e5e168867909d
     metrics:
     - type: cosine_pearson
       value: 86.86608529160739
       value: 86.86608529160739
     - type: spearman
       value: 82.88625166203383
+  - task:
       type: STS
+    dataset:
       name: MTEB STS12
       type: mteb/sts12-sts
+      config: default
+      split: test
+      revision: a0d554a64d88156834ff5ae9920b964011b16384
     metrics:
     - type: cosine_pearson
       value: 87.0445014940449
       value: 87.0445014940449
     - type: spearman
       value: 80.0880365116599
+  - task:
       type: STS
+    dataset:
       name: MTEB STS13
       type: mteb/sts13-sts
+      config: default
+      split: test
+      revision: 7e90230a92c190f1bf69ae9002b8cea547a64cca
     metrics:
     - type: cosine_pearson
       value: 89.33900828959968
       value: 89.33900828959968
     - type: spearman
       value: 89.68256358526733
+  - task:
       type: STS
+    dataset:
       name: MTEB STS14
       type: mteb/sts14-sts
+      config: default
+      split: test
+      revision: 6031580fec1f6af667f0bd2da0a551cf4f0b2375
     metrics:
     - type: cosine_pearson
       value: 86.42029843639123
       value: 86.42029843639123
     - type: spearman
       value: 85.0707889220723
+  - task:
       type: STS
+    dataset:
       name: MTEB STS15
       type: mteb/sts15-sts
+      config: default
+      split: test
+      revision: ae752c7c21bf194d8b67fd573edf7ae58183cbe3
     metrics:
     - type: cosine_pearson
       value: 88.3660081271444
       value: 88.3660081271444
     - type: spearman
       value: 89.39375083609528
+  - task:
       type: STS
+    dataset:
       name: MTEB STS16
       type: mteb/sts16-sts
+      config: default
+      split: test
+      revision: 4d8694f8f0e0100860b497b999b3dbed754a0513
     metrics:
     - type: cosine_pearson
       value: 85.60708247171874
       value: 85.60708247171874
     - type: spearman
       value: 87.15234952832193
+  - task:
       type: STS
+    dataset:
       name: MTEB STS17 (en-en)
       type: mteb/sts17-crosslingual-sts
+      config: en-en
+      split: test
+      revision: faeb762787bd10488a50c8b5be4a3b82e411949c
     metrics:
     - type: cosine_pearson
       value: 91.25898556808458
       value: 91.25898556808458
     - type: spearman
       value: 91.35372390581641
+  - task:
       type: STS
+    dataset:
       name: MTEB STS22 (en)
       type: mteb/sts22-crosslingual-sts
+      config: en
+      split: test
+      revision: de9d86b3b84231dc21f76c7b7af1f28e2f57f6e3
     metrics:
     - type: cosine_pearson
       value: 67.61637111515797
       value: 67.61637111515797
     - type: spearman
       value: 68.10379096526697
+  - task:
       type: STS
+    dataset:
       name: MTEB STSBenchmark
       type: mteb/stsbenchmark-sts
+      config: default
+      split: test
+      revision: b0fddb56ed78048fa8b90373c8a3cfc37b684831
     metrics:
     - type: cosine_pearson
       value: 87.81592853782297
       value: 87.81592853782297
     - type: spearman
       value: 88.2302550329183
+  - task:
+      type: Reranking
+    dataset:
       name: MTEB SciDocsRR
       type: mteb/scidocs-reranking
+      config: default
+      split: test
+      revision: d3c5e1fc0b855ab6097bf1cda04dd73947d7caab
     metrics:
     - type: main_score
       value: 89.196009707431
       value: 86.38341077184032
     - type: nAUC_mrr_std
       value: 75.38945014727746
+  - task:
+      type: Retrieval
+    dataset:
       name: MTEB SciFact
       type: mteb/scifact
+      config: default
+      split: test
+      revision: 0228b52cf27578f30900b9e5271d331663a030d7
     metrics:
     - type: main_score
       value: 80.08999999999999
       value: 80.972
     - type: recall_at_5
       value: 89.90599999999999
+  - task:
+      type: PairClassification
+    dataset:
       name: MTEB SprintDuplicateQuestions
       type: mteb/sprintduplicatequestions-pairclassification
+      config: default
+      split: test
+      revision: d66bd1f72af766a5cc4b0ca5e00c162f89e8cc46
     metrics:
     - type: cosine_accuracy
       value: 99.81881188118813
       value: 92.59645464025026
     - type: similarity_recall
       value: 88.8
+  - task:
+      type: Clustering
+    dataset:
       name: MTEB StackExchangeClustering
       type: mteb/stackexchange-clustering
+      config: default
+      split: test
+      revision: 6cbc1f7b2bc0622f2e39d2c77fa502909748c259
     metrics:
     - type: main_score
       value: 80.28558559137414
       value: 80.28558559137414
     - type: v_measure_std
       value: 2.795276520287584
+  - task:
       type: Clustering
+    dataset:
       name: MTEB StackExchangeClusteringP2P
       type: mteb/stackexchange-clustering-p2p
+      config: default
+      split: test
+      revision: 815ca46b2622cec33ccafc3735d572c266efdb44
     metrics:
     - type: main_score
       value: 49.57135582416209
       value: 49.57135582416209
     - type: v_measure_std
       value: 1.6414135468423754
+  - task:
+      type: Reranking
+    dataset:
       name: MTEB StackOverflowDupQuestions
       type: mteb/stackoverflowdupquestions-reranking
+      config: default
+      split: test
+      revision: e185fbe320c72810689fc5848eb6114e1ef5ec69
     metrics:
     - type: main_score
       value: 55.253002583598644
       value: 10.586310195339053
     - type: nAUC_mrr_std
       value: 8.47326494370076
+  - task:
+      type: Summarization
+    dataset:
       name: MTEB SummEval
       type: mteb/summeval
+      config: default
+      split: test
+      revision: cda12ad7615edc362dbf25a00fdd61d3b1eaf93c
     metrics:
     - type: cosine_pearson
       value: 31.19874648747059
       value: 31.19874648747059
     - type: spearman
       value: 31.493550648844863
+  - task:
+      type: Retrieval
+    dataset:
       name: MTEB TRECCOVID
       type: mteb/trec-covid
+      config: default
+      split: test
+      revision: bb9466bac8153a0349341eb1b22e06409e78ef4e
     metrics:
     - type: main_score
       value: 85.983
       value: 0.7250000000000001
     - type: recall_at_5
       value: 1.1820000000000002
+  - task:
       type: Retrieval
+    dataset:
       name: MTEB Touche2020
       type: mteb/touche2020
+      config: default
+      split: test
+      revision: a34f9a33db75fa0cbb21bb5cfc3dae8dc8bec93f
     metrics:
     - type: main_score
       value: 29.944
       value: 7.383000000000001
     - type: recall_at_5
       value: 11.434
+  - task:
+      type: Classification
+    dataset:
       name: MTEB ToxicConversationsClassification
       type: mteb/toxic_conversations_50k
+      config: default
+      split: test
+      revision: edfaf9da55d3dd50d43143d90c1ac476895ae6de
     metrics:
     - type: accuracy
       value: 88.759765625
       value: 90.54372649306606
     - type: main_score
       value: 88.759765625
+  - task:
       type: Classification
+    dataset:
       name: MTEB TweetSentimentExtractionClassification
       type: mteb/tweet_sentiment_extraction
+      config: default
+      split: test
+      revision: d604517c81ca91fe16a244d1248fc021f9ecee7a
     metrics:
     - type: accuracy
       value: 74.8443689869836
       value: 74.7369003946243
     - type: main_score
       value: 74.8443689869836
+  - task:
+      type: Clustering
+    dataset:
       name: MTEB TwentyNewsgroupsClustering
       type: mteb/twentynewsgroups-clustering
+      config: default
+      split: test
+      revision: 6125ec4e24fa026cec8a478383ee943acfbd5449
     metrics:
     - type: main_score
       value: 61.42918790942448
       value: 61.42918790942448
     - type: v_measure_std
       value: 1.0156550098843082
+  - task:
+      type: PairClassification
+    dataset:
       name: MTEB TwitterSemEval2015
       type: mteb/twittersemeval2015-pairclassification
+      config: default
+      split: test
+      revision: 70970daeab8776df92f5ea462b6173c0b46fd2d1
     metrics:
     - type: cosine_accuracy
       value: 88.22197055492639
       value: 71.64922770303936
     - type: similarity_recall
       value: 75.8839050131926
+  - task:
       type: PairClassification
+    dataset:
       name: MTEB TwitterURLCorpus
       type: mteb/twitterurlcorpus-pairclassification
+      config: default
+      split: test
+      revision: 8b6510b0b1fa4e4c4f879467980e9be563ec1cdf
     metrics:
     - type: cosine_accuracy
       value: 89.88628866379477
       value: 76.93126197063205
     - type: similarity_recall
       value: 83.50015398829689
 ---

onnx/added_tokens.json ADDED Viewed

	@@ -0,0 +1,5 @@

+{
+  "<|endoftext|>": 151643,
+  "<|im_end|>": 151645,
+  "<|im_start|>": 151644
+}

onnx/config.json ADDED Viewed

	@@ -0,0 +1,35 @@

+{
+  "_attn_implementation_autoset": true,
+  "architectures": [
+    "Qwen2ForCausalLM"
+  ],
+  "attention_dropout": 0.0,
+  "auto_map": {
+    "AutoModel": "NovaSearch/stella_en_1.5B_v5--modeling_qwen.Qwen2Model",
+    "AutoModelForCausalLM": "NovaSearch/stella_en_1.5B_v5--modeling_qwen.Qwen2ForCausalLM",
+    "AutoModelForSequenceClassification": "NovaSearch/stella_en_1.5B_v5--modeling_qwen.Qwen2ForSequenceClassification"
+  },
+  "bos_token_id": 151643,
+  "eos_token_id": 151643,
+  "export_model_type": "transformer",
+  "hidden_act": "silu",
+  "hidden_size": 1536,
+  "initializer_range": 0.02,
+  "intermediate_size": 8960,
+  "max_position_embeddings": 131072,
+  "max_window_layers": 21,
+  "model_type": "qwen2",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 28,
+  "num_key_value_heads": 2,
+  "rms_norm_eps": 1e-06,
+  "rope_scaling": null,
+  "rope_theta": 1000000.0,
+  "sliding_window": 131072,
+  "tie_word_embeddings": false,
+  "torch_dtype": "float32",
+  "transformers_version": "4.51.3",
+  "use_cache": true,
+  "use_sliding_window": false,
+  "vocab_size": 151646
+}

onnx/merges.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

onnx/model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8b8d12c8210ae19b00bbdca6ddfe3d70da0d46312c72bcfa1fd6e3707cfdd7d2
-size 874851

 version https://git-lfs.github.com/spec/v1
+oid sha256:6b44c618d7f278c8b171a78c6635b844caa144556b46d144ecaaac8562f6f927
+size 1430611

onnx/model.onnx_data CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4d9d0ac35b704186bd6bf7d969ebccc7929e0cb13acae9f088a061e433141f29
-size 6313588736

 version https://git-lfs.github.com/spec/v1
+oid sha256:b96b4485d9715a6efb678336ed8069976eca6d7b85f05188f3142ffb0561f667
+size 6179371008

onnx/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,20 @@

+{
+  "additional_special_tokens": [
+    "<|im_start|>",
+    "<|im_end|>"
+  ],
+  "eos_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

onnx/tokenizer.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d8372feaa064372d176aff57e8f1e64f194814bb074519104f64c66a2825f091
+size 11419037

onnx/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,51 @@

+{
+  "add_eos_token": true,
+  "add_prefix_space": false,
+  "added_tokens_decoder": {
+    "151643": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151644": {
+      "content": "<|im_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151645": {
+      "content": "<|im_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "additional_special_tokens": [
+    "<|im_start|>",
+    "<|im_end|>"
+  ],
+  "auto_map": {
+    "AutoTokenizer": [
+      "NovaSearch/stella_en_1.5B_v5--tokenization_qwen.Qwen2Tokenizer",
+      "NovaSearch/stella_en_1.5B_v5--tokenization_qwen.Qwen2TokenizerFast"
+    ]
+  },
+  "bos_token": null,
+  "chat_template": "{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "<|endoftext|>",
+  "errors": "replace",
+  "extra_special_tokens": {},
+  "model_max_length": 32768,
+  "pad_token": "<|endoftext|>",
+  "split_special_tokens": false,
+  "tokenizer_class": "Qwen2Tokenizer",
+  "unk_token": null
+}

onnx/vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff