abukhoyer committed on
Commit
6764ba7
·
verified ·
1 Parent(s): 7817065

Adding ONNX file of this model

Browse files

Beep boop I am the [ONNX export bot 🤖🏎️](https://huggingface.co/spaces/onnx/export). On behalf of [abukhoyer](https://huggingface.co/abukhoyer), I would like to add to this repository the model converted to ONNX.

What is ONNX? It stands for "Open Neural Network Exchange", and is the most commonly used open standard for machine learning interoperability. You can find out more at [onnx.ai](https://onnx.ai/)!

The exported ONNX model can then be consumed by various backends such as TensorRT or TVM, or simply be used in a few lines with 🤗 Optimum through ONNX Runtime; check out how [here](https://huggingface.co/docs/optimum/main/en/onnxruntime/usage_guides/models)!

.gitattributes CHANGED
@@ -35,3 +35,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  onnx/model.onnx_data filter=lfs diff=lfs merge=lfs -text
37
  onnx/model_fp16.onnx_data filter=lfs diff=lfs merge=lfs -text
 
 
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  onnx/model.onnx_data filter=lfs diff=lfs merge=lfs -text
37
  onnx/model_fp16.onnx_data filter=lfs diff=lfs merge=lfs -text
38
+ onnx/tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md CHANGED
@@ -1,13 +1,22 @@
1
  ---
 
 
 
 
 
 
 
2
  model-index:
3
  - name: stella_en_1.5B_v5
4
  results:
5
- - dataset:
6
- config: en
 
7
  name: MTEB AmazonCounterfactualClassification (en)
8
- revision: e8379541af4e31359cca9fbcf4b00f2671dba205
9
- split: test
10
  type: mteb/amazon_counterfactual
 
 
 
11
  metrics:
12
  - type: accuracy
13
  value: 92.86567164179104
@@ -21,14 +30,14 @@ model-index:
21
  value: 93.13621183004571
22
  - type: main_score
23
  value: 92.86567164179104
24
- task:
25
  type: Classification
26
- - dataset:
27
- config: default
28
  name: MTEB AmazonPolarityClassification
29
- revision: e2d317d38cd51312af73b3d32a06d1a08b442046
30
- split: test
31
  type: mteb/amazon_polarity
 
 
 
32
  metrics:
33
  - type: accuracy
34
  value: 97.16485
@@ -42,14 +51,14 @@ model-index:
42
  value: 97.16351087403213
43
  - type: main_score
44
  value: 97.16485
45
- task:
46
  type: Classification
47
- - dataset:
48
- config: en
49
  name: MTEB AmazonReviewsClassification (en)
50
- revision: 1399c76144fd37290681b995c656ef9b2e06e26d
51
- split: test
52
  type: mteb/amazon_reviews_multi
 
 
 
53
  metrics:
54
  - type: accuracy
55
  value: 59.358
@@ -59,14 +68,14 @@ model-index:
59
  value: 59.0264615883114
60
  - type: main_score
61
  value: 59.358
62
- task:
63
- type: Classification
64
- - dataset:
65
- config: default
66
  name: MTEB ArguAna
67
- revision: c22ab2a51041ffd869aaddef7af8d8215647e41a
68
- split: test
69
  type: mteb/arguana
 
 
 
70
  metrics:
71
  - type: main_score
72
  value: 65.269
@@ -350,14 +359,14 @@ model-index:
350
  value: 67.354
351
  - type: recall_at_5
352
  value: 78.236
353
- task:
354
- type: Retrieval
355
- - dataset:
356
- config: default
357
  name: MTEB ArxivClusteringP2P
358
- revision: a122ad7f3f0291bf49cc6f4d32aa80929df69d5d
359
- split: test
360
  type: mteb/arxiv-clustering-p2p
 
 
 
361
  metrics:
362
  - type: main_score
363
  value: 55.437138353189994
@@ -365,14 +374,14 @@ model-index:
365
  value: 55.437138353189994
366
  - type: v_measure_std
367
  value: 14.718556601335491
368
- task:
369
  type: Clustering
370
- - dataset:
371
- config: default
372
  name: MTEB ArxivClusteringS2S
373
- revision: f910caf1a6075f7329cdf8c1a6135696f37dbd53
374
- split: test
375
  type: mteb/arxiv-clustering-s2s
 
 
 
376
  metrics:
377
  - type: main_score
378
  value: 50.65858459544658
@@ -380,14 +389,14 @@ model-index:
380
  value: 50.65858459544658
381
  - type: v_measure_std
382
  value: 14.887033747525146
383
- task:
384
- type: Clustering
385
- - dataset:
386
- config: default
387
  name: MTEB AskUbuntuDupQuestions
388
- revision: 2000358ca161889fa9c082cb41daa8dcfb161a54
389
- split: test
390
  type: mteb/askubuntudupquestions-reranking
 
 
 
391
  metrics:
392
  - type: main_score
393
  value: 67.32597152838535
@@ -407,14 +416,14 @@ model-index:
407
  value: 41.64561939958336
408
  - type: nAUC_mrr_std
409
  value: 23.179909345891968
410
- task:
411
- type: Reranking
412
- - dataset:
413
- config: default
414
  name: MTEB BIOSSES
415
- revision: d3fb88f8f02e40887cd149695127462bbcf29b4a
416
- split: test
417
  type: mteb/biosses-sts
 
 
 
418
  metrics:
419
  - type: cosine_pearson
420
  value: 85.790820496042
@@ -434,14 +443,14 @@ model-index:
434
  value: 85.790820496042
435
  - type: spearman
436
  value: 83.10731534330517
437
- task:
438
- type: STS
439
- - dataset:
440
- config: default
441
  name: MTEB Banking77Classification
442
- revision: 0fd18e25b25c072e09e0d92ab615fda904d66300
443
- split: test
444
  type: mteb/banking77
 
 
 
445
  metrics:
446
  - type: accuracy
447
  value: 89.78896103896105
@@ -451,14 +460,14 @@ model-index:
451
  value: 89.76107366333488
452
  - type: main_score
453
  value: 89.78896103896105
454
- task:
455
- type: Classification
456
- - dataset:
457
- config: default
458
  name: MTEB BiorxivClusteringP2P
459
- revision: 65b79d1d13f80053f67aca9498d9402c2d9f1f40
460
- split: test
461
  type: mteb/biorxiv-clustering-p2p
 
 
 
462
  metrics:
463
  - type: main_score
464
  value: 50.68092296236376
@@ -466,14 +475,14 @@ model-index:
466
  value: 50.68092296236376
467
  - type: v_measure_std
468
  value: 0.7832640983085436
469
- task:
470
  type: Clustering
471
- - dataset:
472
- config: default
473
  name: MTEB BiorxivClusteringS2S
474
- revision: 258694dd0231531bc1fd9de6ceb52a0853c6d908
475
- split: test
476
  type: mteb/biorxiv-clustering-s2s
 
 
 
477
  metrics:
478
  - type: main_score
479
  value: 46.86629236732983
@@ -481,14 +490,14 @@ model-index:
481
  value: 46.86629236732983
482
  - type: v_measure_std
483
  value: 0.8784322236350974
484
- task:
485
- type: Clustering
486
- - dataset:
487
- config: default
488
  name: MTEB CQADupstackRetrieval
489
- revision: 4ffe81d471b1924886b33c7567bfb200e9eec5c4
490
- split: test
491
  type: mteb/cqadupstack
 
 
 
492
  metrics:
493
  - type: main_score
494
  value: 47.74883333333334
@@ -772,14 +781,14 @@ model-index:
772
  value: 46.01841666666666
773
  - type: recall_at_5
774
  value: 52.482416666666666
775
- task:
776
  type: Retrieval
777
- - dataset:
778
- config: default
779
  name: MTEB ClimateFEVER
780
- revision: 47f2ac6acb640fc46020b02a5b59fdda04d39380
781
- split: test
782
  type: mteb/climate-fever
 
 
 
783
  metrics:
784
  - type: main_score
785
  value: 46.113
@@ -1063,14 +1072,14 @@ model-index:
1063
  value: 35.150999999999996
1064
  - type: recall_at_5
1065
  value: 42.748000000000005
1066
- task:
1067
  type: Retrieval
1068
- - dataset:
1069
- config: default
1070
  name: MTEB DBPedia
1071
- revision: c0f706b76e590d620bd6618b3ca8efdd34e2d659
1072
- split: test
1073
  type: mteb/dbpedia
 
 
 
1074
  metrics:
1075
  - type: main_score
1076
  value: 52.276999999999994
@@ -1354,14 +1363,14 @@ model-index:
1354
  value: 17.876
1355
  - type: recall_at_5
1356
  value: 22.536
1357
- task:
1358
- type: Retrieval
1359
- - dataset:
1360
- config: default
1361
  name: MTEB EmotionClassification
1362
- revision: 4f58c6b202a23cf9a4da393831edf4f9183cad37
1363
- split: test
1364
  type: mteb/emotion
 
 
 
1365
  metrics:
1366
  - type: accuracy
1367
  value: 84.29499999999999
@@ -1371,14 +1380,14 @@ model-index:
1371
  value: 84.96026012933847
1372
  - type: main_score
1373
  value: 84.29499999999999
1374
- task:
1375
- type: Classification
1376
- - dataset:
1377
- config: default
1378
  name: MTEB FEVER
1379
- revision: bea83ef9e8fb933d90a2f1d5515737465d613e12
1380
- split: test
1381
  type: mteb/fever
 
 
 
1382
  metrics:
1383
  - type: main_score
1384
  value: 94.83200000000001
@@ -1662,14 +1671,14 @@ model-index:
1662
  value: 95.069
1663
  - type: recall_at_5
1664
  value: 96.177
1665
- task:
1666
  type: Retrieval
1667
- - dataset:
1668
- config: default
1669
  name: MTEB FiQA2018
1670
- revision: 27a168819829fe9bcd655c2df245fb19452e8e06
1671
- split: test
1672
  type: mteb/fiqa
 
 
 
1673
  metrics:
1674
  - type: main_score
1675
  value: 60.480000000000004
@@ -1953,14 +1962,14 @@ model-index:
1953
  value: 50.221000000000004
1954
  - type: recall_at_5
1955
  value: 58.209999999999994
1956
- task:
1957
  type: Retrieval
1958
- - dataset:
1959
- config: default
1960
  name: MTEB HotpotQA
1961
- revision: ab518f4d6fcca38d87c25209f94beba119d02014
1962
- split: test
1963
  type: mteb/hotpotqa
 
 
 
1964
  metrics:
1965
  - type: main_score
1966
  value: 76.67399999999999
@@ -2244,14 +2253,14 @@ model-index:
2244
  value: 68.879
2245
  - type: recall_at_5
2246
  value: 73.896
2247
- task:
2248
- type: Retrieval
2249
- - dataset:
2250
- config: default
2251
  name: MTEB ImdbClassification
2252
- revision: 3d86128a09e091d6018b6d26cad27f2739fc2db7
2253
- split: test
2254
  type: mteb/imdb
 
 
 
2255
  metrics:
2256
  - type: accuracy
2257
  value: 96.6608
@@ -2265,14 +2274,14 @@ model-index:
2265
  value: 96.66029695623423
2266
  - type: main_score
2267
  value: 96.6608
2268
- task:
2269
- type: Classification
2270
- - dataset:
2271
- config: default
2272
  name: MTEB MSMARCO
2273
- revision: c5a29a104738b98a9e76336939199e264163d4a0
2274
- split: dev
2275
  type: mteb/msmarco
 
 
 
2276
  metrics:
2277
  - type: main_score
2278
  value: 45.217
@@ -2556,14 +2565,14 @@ model-index:
2556
  value: 45.535
2557
  - type: recall_at_5
2558
  value: 55.394
2559
- task:
2560
- type: Retrieval
2561
- - dataset:
2562
- config: en
2563
  name: MTEB MTOPDomainClassification (en)
2564
- revision: d80d48c1eb48d3562165c59d59d0034df9fff0bf
2565
- split: test
2566
  type: mteb/mtop_domain
 
 
 
2567
  metrics:
2568
  - type: accuracy
2569
  value: 99.01276789785682
@@ -2573,14 +2582,14 @@ model-index:
2573
  value: 99.01406884928141
2574
  - type: main_score
2575
  value: 99.01276789785682
2576
- task:
2577
  type: Classification
2578
- - dataset:
2579
- config: en
2580
  name: MTEB MTOPIntentClassification (en)
2581
- revision: ae001d0e6b1228650b7bd1c2c65fb50ad11a8aba
2582
- split: test
2583
  type: mteb/mtop_intent
 
 
 
2584
  metrics:
2585
  - type: accuracy
2586
  value: 92.78385772913816
@@ -2590,14 +2599,14 @@ model-index:
2590
  value: 93.90424147486428
2591
  - type: main_score
2592
  value: 92.78385772913816
2593
- task:
2594
  type: Classification
2595
- - dataset:
2596
- config: en
2597
  name: MTEB MassiveIntentClassification (en)
2598
- revision: 4672e20407010da34463acc759c162ca9734bca6
2599
- split: test
2600
  type: mteb/amazon_massive_intent
 
 
 
2601
  metrics:
2602
  - type: accuracy
2603
  value: 85.83053127101546
@@ -2607,14 +2616,14 @@ model-index:
2607
  value: 85.81759723866098
2608
  - type: main_score
2609
  value: 85.83053127101546
2610
- task:
2611
  type: Classification
2612
- - dataset:
2613
- config: en
2614
  name: MTEB MassiveScenarioClassification (en)
2615
- revision: fad2c6e8459f9e1c45d9315f4953d921437d70f8
2616
- split: test
2617
  type: mteb/amazon_massive_scenario
 
 
 
2618
  metrics:
2619
  - type: accuracy
2620
  value: 90.19838601210489
@@ -2624,14 +2633,14 @@ model-index:
2624
  value: 90.11422965504119
2625
  - type: main_score
2626
  value: 90.19838601210489
2627
- task:
2628
- type: Classification
2629
- - dataset:
2630
- config: default
2631
  name: MTEB MedrxivClusteringP2P
2632
- revision: e7a26af6f3ae46b30dde8737f02c07b1505bcc73
2633
- split: test
2634
  type: mteb/medrxiv-clustering-p2p
 
 
 
2635
  metrics:
2636
  - type: main_score
2637
  value: 46.866746897607094
@@ -2639,14 +2648,14 @@ model-index:
2639
  value: 46.866746897607094
2640
  - type: v_measure_std
2641
  value: 1.0966477896919726
2642
- task:
2643
  type: Clustering
2644
- - dataset:
2645
- config: default
2646
  name: MTEB MedrxivClusteringS2S
2647
- revision: 35191c8c0dca72d8ff3efcd72aa802307d469663
2648
- split: test
2649
  type: mteb/medrxiv-clustering-s2s
 
 
 
2650
  metrics:
2651
  - type: main_score
2652
  value: 44.6538827415503
@@ -2654,14 +2663,14 @@ model-index:
2654
  value: 44.6538827415503
2655
  - type: v_measure_std
2656
  value: 1.1649569936599116
2657
- task:
2658
- type: Clustering
2659
- - dataset:
2660
- config: default
2661
  name: MTEB MindSmallReranking
2662
- revision: 59042f120c80e8afa9cdbb224f67076cec0fc9a7
2663
- split: test
2664
  type: mteb/mind_small
 
 
 
2665
  metrics:
2666
  - type: main_score
2667
  value: 33.05449204940555
@@ -2681,14 +2690,14 @@ model-index:
2681
  value: -15.304687384645769
2682
  - type: nAUC_mrr_std
2683
  value: -0.519919931348978
2684
- task:
2685
- type: Reranking
2686
- - dataset:
2687
- config: default
2688
  name: MTEB NFCorpus
2689
- revision: ec0fa4fe99da2ff19ca1214b7966684033a58814
2690
- split: test
2691
  type: mteb/nfcorpus
 
 
 
2692
  metrics:
2693
  - type: main_score
2694
  value: 41.998000000000005
@@ -2972,14 +2981,14 @@ model-index:
2972
  value: 13.267999999999999
2973
  - type: recall_at_5
2974
  value: 16.141
2975
- task:
2976
  type: Retrieval
2977
- - dataset:
2978
- config: default
2979
  name: MTEB NQ
2980
- revision: b774495ed302d8c44a3a7ea25c90dbce03968f31
2981
- split: test
2982
  type: mteb/nq
 
 
 
2983
  metrics:
2984
  - type: main_score
2985
  value: 71.8
@@ -3263,14 +3272,14 @@ model-index:
3263
  value: 74.394
3264
  - type: recall_at_5
3265
  value: 82.711
3266
- task:
3267
  type: Retrieval
3268
- - dataset:
3269
- config: default
3270
  name: MTEB QuoraRetrieval
3271
- revision: e4e08e0b7dbe3c8700f0daef558ff32256715259
3272
- split: test
3273
  type: mteb/quora
 
 
 
3274
  metrics:
3275
  - type: main_score
3276
  value: 90.025
@@ -3554,14 +3563,14 @@ model-index:
3554
  value: 89.276
3555
  - type: recall_at_5
3556
  value: 93.46
3557
- task:
3558
- type: Retrieval
3559
- - dataset:
3560
- config: default
3561
  name: MTEB RedditClustering
3562
- revision: 24640382cdbf8abc73003fb0fa6d111a705499eb
3563
- split: test
3564
  type: mteb/reddit-clustering
 
 
 
3565
  metrics:
3566
  - type: main_score
3567
  value: 72.86492101891123
@@ -3569,14 +3578,14 @@ model-index:
3569
  value: 72.86492101891123
3570
  - type: v_measure_std
3571
  value: 2.778711445144635
3572
- task:
3573
  type: Clustering
3574
- - dataset:
3575
- config: default
3576
  name: MTEB RedditClusteringP2P
3577
- revision: 385e3cb46b4cfa89021f56c4380204149d0efe33
3578
- split: test
3579
  type: mteb/reddit-clustering-p2p
 
 
 
3580
  metrics:
3581
  - type: main_score
3582
  value: 75.27316726548479
@@ -3584,14 +3593,14 @@ model-index:
3584
  value: 75.27316726548479
3585
  - type: v_measure_std
3586
  value: 8.87871936725338
3587
- task:
3588
- type: Clustering
3589
- - dataset:
3590
- config: default
3591
  name: MTEB SCIDOCS
3592
- revision: f8c2fcf00f625baaa80f62ec5bd9e1fff3b8ae88
3593
- split: test
3594
  type: mteb/scidocs
 
 
 
3595
  metrics:
3596
  - type: main_score
3597
  value: 26.638
@@ -3875,14 +3884,14 @@ model-index:
3875
  value: 14.127999999999998
3876
  - type: recall_at_5
3877
  value: 19.673
3878
- task:
3879
- type: Retrieval
3880
- - dataset:
3881
- config: default
3882
  name: MTEB SICK-R
3883
- revision: 20a6d6f312dd54037fe07a32d58e5e168867909d
3884
- split: test
3885
  type: mteb/sickr-sts
 
 
 
3886
  metrics:
3887
  - type: cosine_pearson
3888
  value: 86.86608529160739
@@ -3902,14 +3911,14 @@ model-index:
3902
  value: 86.86608529160739
3903
  - type: spearman
3904
  value: 82.88625166203383
3905
- task:
3906
  type: STS
3907
- - dataset:
3908
- config: default
3909
  name: MTEB STS12
3910
- revision: a0d554a64d88156834ff5ae9920b964011b16384
3911
- split: test
3912
  type: mteb/sts12-sts
 
 
 
3913
  metrics:
3914
  - type: cosine_pearson
3915
  value: 87.0445014940449
@@ -3929,14 +3938,14 @@ model-index:
3929
  value: 87.0445014940449
3930
  - type: spearman
3931
  value: 80.0880365116599
3932
- task:
3933
  type: STS
3934
- - dataset:
3935
- config: default
3936
  name: MTEB STS13
3937
- revision: 7e90230a92c190f1bf69ae9002b8cea547a64cca
3938
- split: test
3939
  type: mteb/sts13-sts
 
 
 
3940
  metrics:
3941
  - type: cosine_pearson
3942
  value: 89.33900828959968
@@ -3956,14 +3965,14 @@ model-index:
3956
  value: 89.33900828959968
3957
  - type: spearman
3958
  value: 89.68256358526733
3959
- task:
3960
  type: STS
3961
- - dataset:
3962
- config: default
3963
  name: MTEB STS14
3964
- revision: 6031580fec1f6af667f0bd2da0a551cf4f0b2375
3965
- split: test
3966
  type: mteb/sts14-sts
 
 
 
3967
  metrics:
3968
  - type: cosine_pearson
3969
  value: 86.42029843639123
@@ -3983,14 +3992,14 @@ model-index:
3983
  value: 86.42029843639123
3984
  - type: spearman
3985
  value: 85.0707889220723
3986
- task:
3987
  type: STS
3988
- - dataset:
3989
- config: default
3990
  name: MTEB STS15
3991
- revision: ae752c7c21bf194d8b67fd573edf7ae58183cbe3
3992
- split: test
3993
  type: mteb/sts15-sts
 
 
 
3994
  metrics:
3995
  - type: cosine_pearson
3996
  value: 88.3660081271444
@@ -4010,14 +4019,14 @@ model-index:
4010
  value: 88.3660081271444
4011
  - type: spearman
4012
  value: 89.39375083609528
4013
- task:
4014
  type: STS
4015
- - dataset:
4016
- config: default
4017
  name: MTEB STS16
4018
- revision: 4d8694f8f0e0100860b497b999b3dbed754a0513
4019
- split: test
4020
  type: mteb/sts16-sts
 
 
 
4021
  metrics:
4022
  - type: cosine_pearson
4023
  value: 85.60708247171874
@@ -4037,14 +4046,14 @@ model-index:
4037
  value: 85.60708247171874
4038
  - type: spearman
4039
  value: 87.15234952832193
4040
- task:
4041
  type: STS
4042
- - dataset:
4043
- config: en-en
4044
  name: MTEB STS17 (en-en)
4045
- revision: faeb762787bd10488a50c8b5be4a3b82e411949c
4046
- split: test
4047
  type: mteb/sts17-crosslingual-sts
 
 
 
4048
  metrics:
4049
  - type: cosine_pearson
4050
  value: 91.25898556808458
@@ -4064,14 +4073,14 @@ model-index:
4064
  value: 91.25898556808458
4065
  - type: spearman
4066
  value: 91.35372390581641
4067
- task:
4068
  type: STS
4069
- - dataset:
4070
- config: en
4071
  name: MTEB STS22 (en)
4072
- revision: de9d86b3b84231dc21f76c7b7af1f28e2f57f6e3
4073
- split: test
4074
  type: mteb/sts22-crosslingual-sts
 
 
 
4075
  metrics:
4076
  - type: cosine_pearson
4077
  value: 67.61637111515797
@@ -4091,14 +4100,14 @@ model-index:
4091
  value: 67.61637111515797
4092
  - type: spearman
4093
  value: 68.10379096526697
4094
- task:
4095
  type: STS
4096
- - dataset:
4097
- config: default
4098
  name: MTEB STSBenchmark
4099
- revision: b0fddb56ed78048fa8b90373c8a3cfc37b684831
4100
- split: test
4101
  type: mteb/stsbenchmark-sts
 
 
 
4102
  metrics:
4103
  - type: cosine_pearson
4104
  value: 87.81592853782297
@@ -4118,14 +4127,14 @@ model-index:
4118
  value: 87.81592853782297
4119
  - type: spearman
4120
  value: 88.2302550329183
4121
- task:
4122
- type: STS
4123
- - dataset:
4124
- config: default
4125
  name: MTEB SciDocsRR
4126
- revision: d3c5e1fc0b855ab6097bf1cda04dd73947d7caab
4127
- split: test
4128
  type: mteb/scidocs-reranking
 
 
 
4129
  metrics:
4130
  - type: main_score
4131
  value: 89.196009707431
@@ -4145,14 +4154,14 @@ model-index:
4145
  value: 86.38341077184032
4146
  - type: nAUC_mrr_std
4147
  value: 75.38945014727746
4148
- task:
4149
- type: Reranking
4150
- - dataset:
4151
- config: default
4152
  name: MTEB SciFact
4153
- revision: 0228b52cf27578f30900b9e5271d331663a030d7
4154
- split: test
4155
  type: mteb/scifact
 
 
 
4156
  metrics:
4157
  - type: main_score
4158
  value: 80.08999999999999
@@ -4436,14 +4445,14 @@ model-index:
4436
  value: 80.972
4437
  - type: recall_at_5
4438
  value: 89.90599999999999
4439
- task:
4440
- type: Retrieval
4441
- - dataset:
4442
- config: default
4443
  name: MTEB SprintDuplicateQuestions
4444
- revision: d66bd1f72af766a5cc4b0ca5e00c162f89e8cc46
4445
- split: test
4446
  type: mteb/sprintduplicatequestions-pairclassification
 
 
 
4447
  metrics:
4448
  - type: cosine_accuracy
4449
  value: 99.81881188118813
@@ -4525,14 +4534,14 @@ model-index:
4525
  value: 92.59645464025026
4526
  - type: similarity_recall
4527
  value: 88.8
4528
- task:
4529
- type: PairClassification
4530
- - dataset:
4531
- config: default
4532
  name: MTEB StackExchangeClustering
4533
- revision: 6cbc1f7b2bc0622f2e39d2c77fa502909748c259
4534
- split: test
4535
  type: mteb/stackexchange-clustering
 
 
 
4536
  metrics:
4537
  - type: main_score
4538
  value: 80.28558559137414
@@ -4540,14 +4549,14 @@ model-index:
4540
  value: 80.28558559137414
4541
  - type: v_measure_std
4542
  value: 2.795276520287584
4543
- task:
4544
  type: Clustering
4545
- - dataset:
4546
- config: default
4547
  name: MTEB StackExchangeClusteringP2P
4548
- revision: 815ca46b2622cec33ccafc3735d572c266efdb44
4549
- split: test
4550
  type: mteb/stackexchange-clustering-p2p
 
 
 
4551
  metrics:
4552
  - type: main_score
4553
  value: 49.57135582416209
@@ -4555,14 +4564,14 @@ model-index:
4555
  value: 49.57135582416209
4556
  - type: v_measure_std
4557
  value: 1.6414135468423754
4558
- task:
4559
- type: Clustering
4560
- - dataset:
4561
- config: default
4562
  name: MTEB StackOverflowDupQuestions
4563
- revision: e185fbe320c72810689fc5848eb6114e1ef5ec69
4564
- split: test
4565
  type: mteb/stackoverflowdupquestions-reranking
 
 
 
4566
  metrics:
4567
  - type: main_score
4568
  value: 55.253002583598644
@@ -4582,14 +4591,14 @@ model-index:
4582
  value: 10.586310195339053
4583
  - type: nAUC_mrr_std
4584
  value: 8.47326494370076
4585
- task:
4586
- type: Reranking
4587
- - dataset:
4588
- config: default
4589
  name: MTEB SummEval
4590
- revision: cda12ad7615edc362dbf25a00fdd61d3b1eaf93c
4591
- split: test
4592
  type: mteb/summeval
 
 
 
4593
  metrics:
4594
  - type: cosine_pearson
4595
  value: 31.19874648747059
@@ -4605,14 +4614,14 @@ model-index:
4605
  value: 31.19874648747059
4606
  - type: spearman
4607
  value: 31.493550648844863
4608
- task:
4609
- type: Summarization
4610
- - dataset:
4611
- config: default
4612
  name: MTEB TRECCOVID
4613
- revision: bb9466bac8153a0349341eb1b22e06409e78ef4e
4614
- split: test
4615
  type: mteb/trec-covid
 
 
 
4616
  metrics:
4617
  - type: main_score
4618
  value: 85.983
@@ -4896,14 +4905,14 @@ model-index:
4896
  value: 0.7250000000000001
4897
  - type: recall_at_5
4898
  value: 1.1820000000000002
4899
- task:
4900
  type: Retrieval
4901
- - dataset:
4902
- config: default
4903
  name: MTEB Touche2020
4904
- revision: a34f9a33db75fa0cbb21bb5cfc3dae8dc8bec93f
4905
- split: test
4906
  type: mteb/touche2020
 
 
 
4907
  metrics:
4908
  - type: main_score
4909
  value: 29.944
@@ -5187,14 +5196,14 @@ model-index:
5187
  value: 7.383000000000001
5188
  - type: recall_at_5
5189
  value: 11.434
5190
- task:
5191
- type: Retrieval
5192
- - dataset:
5193
- config: default
5194
  name: MTEB ToxicConversationsClassification
5195
- revision: edfaf9da55d3dd50d43143d90c1ac476895ae6de
5196
- split: test
5197
  type: mteb/toxic_conversations_50k
 
 
 
5198
  metrics:
5199
  - type: accuracy
5200
  value: 88.759765625
@@ -5208,14 +5217,14 @@ model-index:
5208
  value: 90.54372649306606
5209
  - type: main_score
5210
  value: 88.759765625
5211
- task:
5212
  type: Classification
5213
- - dataset:
5214
- config: default
5215
  name: MTEB TweetSentimentExtractionClassification
5216
- revision: d604517c81ca91fe16a244d1248fc021f9ecee7a
5217
- split: test
5218
  type: mteb/tweet_sentiment_extraction
 
 
 
5219
  metrics:
5220
  - type: accuracy
5221
  value: 74.8443689869836
@@ -5225,14 +5234,14 @@ model-index:
5225
  value: 74.7369003946243
5226
  - type: main_score
5227
  value: 74.8443689869836
5228
- task:
5229
- type: Classification
5230
- - dataset:
5231
- config: default
5232
  name: MTEB TwentyNewsgroupsClustering
5233
- revision: 6125ec4e24fa026cec8a478383ee943acfbd5449
5234
- split: test
5235
  type: mteb/twentynewsgroups-clustering
 
 
 
5236
  metrics:
5237
  - type: main_score
5238
  value: 61.42918790942448
@@ -5240,14 +5249,14 @@ model-index:
5240
  value: 61.42918790942448
5241
  - type: v_measure_std
5242
  value: 1.0156550098843082
5243
- task:
5244
- type: Clustering
5245
- - dataset:
5246
- config: default
5247
  name: MTEB TwitterSemEval2015
5248
- revision: 70970daeab8776df92f5ea462b6173c0b46fd2d1
5249
- split: test
5250
  type: mteb/twittersemeval2015-pairclassification
 
 
 
5251
  metrics:
5252
  - type: cosine_accuracy
5253
  value: 88.22197055492639
@@ -5329,14 +5338,14 @@ model-index:
5329
  value: 71.64922770303936
5330
  - type: similarity_recall
5331
  value: 75.8839050131926
5332
- task:
5333
  type: PairClassification
5334
- - dataset:
5335
- config: default
5336
  name: MTEB TwitterURLCorpus
5337
- revision: 8b6510b0b1fa4e4c4f879467980e9be563ec1cdf
5338
- split: test
5339
  type: mteb/twitterurlcorpus-pairclassification
 
 
 
5340
  metrics:
5341
  - type: cosine_accuracy
5342
  value: 89.88628866379477
@@ -5418,14 +5427,6 @@ model-index:
5418
  value: 76.93126197063205
5419
  - type: similarity_recall
5420
  value: 83.50015398829689
5421
- task:
5422
- type: PairClassification
5423
- tags:
5424
- - mteb
5425
- - sentence-transformers
5426
- - transformers
5427
- - sentence-similarity
5428
- license: mit
5429
  ---
5430
 
5431
 
 
1
  ---
2
+ tags:
3
+ - mteb
4
+ - sentence-transformers
5
+ - transformers
6
+ - sentence-similarity
7
+ - onnx
8
+ license: mit
9
  model-index:
10
  - name: stella_en_1.5B_v5
11
  results:
12
+ - task:
13
+ type: Classification
14
+ dataset:
15
  name: MTEB AmazonCounterfactualClassification (en)
 
 
16
  type: mteb/amazon_counterfactual
17
+ config: en
18
+ split: test
19
+ revision: e8379541af4e31359cca9fbcf4b00f2671dba205
20
  metrics:
21
  - type: accuracy
22
  value: 92.86567164179104
 
30
  value: 93.13621183004571
31
  - type: main_score
32
  value: 92.86567164179104
33
+ - task:
34
  type: Classification
35
+ dataset:
 
36
  name: MTEB AmazonPolarityClassification
 
 
37
  type: mteb/amazon_polarity
38
+ config: default
39
+ split: test
40
+ revision: e2d317d38cd51312af73b3d32a06d1a08b442046
41
  metrics:
42
  - type: accuracy
43
  value: 97.16485
 
51
  value: 97.16351087403213
52
  - type: main_score
53
  value: 97.16485
54
+ - task:
55
  type: Classification
56
+ dataset:
 
57
  name: MTEB AmazonReviewsClassification (en)
 
 
58
  type: mteb/amazon_reviews_multi
59
+ config: en
60
+ split: test
61
+ revision: 1399c76144fd37290681b995c656ef9b2e06e26d
62
  metrics:
63
  - type: accuracy
64
  value: 59.358
 
68
  value: 59.0264615883114
69
  - type: main_score
70
  value: 59.358
71
+ - task:
72
+ type: Retrieval
73
+ dataset:
 
74
  name: MTEB ArguAna
 
 
75
  type: mteb/arguana
76
+ config: default
77
+ split: test
78
+ revision: c22ab2a51041ffd869aaddef7af8d8215647e41a
79
  metrics:
80
  - type: main_score
81
  value: 65.269
 
359
  value: 67.354
360
  - type: recall_at_5
361
  value: 78.236
362
+ - task:
363
+ type: Clustering
364
+ dataset:
 
365
  name: MTEB ArxivClusteringP2P
 
 
366
  type: mteb/arxiv-clustering-p2p
367
+ config: default
368
+ split: test
369
+ revision: a122ad7f3f0291bf49cc6f4d32aa80929df69d5d
370
  metrics:
371
  - type: main_score
372
  value: 55.437138353189994
 
374
  value: 55.437138353189994
375
  - type: v_measure_std
376
  value: 14.718556601335491
377
+ - task:
378
  type: Clustering
379
+ dataset:
 
380
  name: MTEB ArxivClusteringS2S
 
 
381
  type: mteb/arxiv-clustering-s2s
382
+ config: default
383
+ split: test
384
+ revision: f910caf1a6075f7329cdf8c1a6135696f37dbd53
385
  metrics:
386
  - type: main_score
387
  value: 50.65858459544658
 
389
  value: 50.65858459544658
390
  - type: v_measure_std
391
  value: 14.887033747525146
392
+ - task:
393
+ type: Reranking
394
+ dataset:
 
395
  name: MTEB AskUbuntuDupQuestions
 
 
396
  type: mteb/askubuntudupquestions-reranking
397
+ config: default
398
+ split: test
399
+ revision: 2000358ca161889fa9c082cb41daa8dcfb161a54
400
  metrics:
401
  - type: main_score
402
  value: 67.32597152838535
 
416
  value: 41.64561939958336
417
  - type: nAUC_mrr_std
418
  value: 23.179909345891968
419
+ - task:
420
+ type: STS
421
+ dataset:
 
422
  name: MTEB BIOSSES
 
 
423
  type: mteb/biosses-sts
424
+ config: default
425
+ split: test
426
+ revision: d3fb88f8f02e40887cd149695127462bbcf29b4a
427
  metrics:
428
  - type: cosine_pearson
429
  value: 85.790820496042
 
443
  value: 85.790820496042
444
  - type: spearman
445
  value: 83.10731534330517
446
+ - task:
447
+ type: Classification
448
+ dataset:
 
449
  name: MTEB Banking77Classification
 
 
450
  type: mteb/banking77
451
+ config: default
452
+ split: test
453
+ revision: 0fd18e25b25c072e09e0d92ab615fda904d66300
454
  metrics:
455
  - type: accuracy
456
  value: 89.78896103896105
 
460
  value: 89.76107366333488
461
  - type: main_score
462
  value: 89.78896103896105
463
+ - task:
464
+ type: Clustering
465
+ dataset:
 
466
  name: MTEB BiorxivClusteringP2P
 
 
467
  type: mteb/biorxiv-clustering-p2p
468
+ config: default
469
+ split: test
470
+ revision: 65b79d1d13f80053f67aca9498d9402c2d9f1f40
471
  metrics:
472
  - type: main_score
473
  value: 50.68092296236376
 
475
  value: 50.68092296236376
476
  - type: v_measure_std
477
  value: 0.7832640983085436
478
+ - task:
479
  type: Clustering
480
+ dataset:
 
481
  name: MTEB BiorxivClusteringS2S
 
 
482
  type: mteb/biorxiv-clustering-s2s
483
+ config: default
484
+ split: test
485
+ revision: 258694dd0231531bc1fd9de6ceb52a0853c6d908
486
  metrics:
487
  - type: main_score
488
  value: 46.86629236732983
 
490
  value: 46.86629236732983
491
  - type: v_measure_std
492
  value: 0.8784322236350974
493
+ - task:
494
+ type: Retrieval
495
+ dataset:
 
496
  name: MTEB CQADupstackRetrieval
 
 
497
  type: mteb/cqadupstack
498
+ config: default
499
+ split: test
500
+ revision: 4ffe81d471b1924886b33c7567bfb200e9eec5c4
501
  metrics:
502
  - type: main_score
503
  value: 47.74883333333334
 
781
  value: 46.01841666666666
782
  - type: recall_at_5
783
  value: 52.482416666666666
784
+ - task:
785
  type: Retrieval
786
+ dataset:
 
787
  name: MTEB ClimateFEVER
 
 
788
  type: mteb/climate-fever
789
+ config: default
790
+ split: test
791
+ revision: 47f2ac6acb640fc46020b02a5b59fdda04d39380
792
  metrics:
793
  - type: main_score
794
  value: 46.113
 
1072
  value: 35.150999999999996
1073
  - type: recall_at_5
1074
  value: 42.748000000000005
1075
+ - task:
1076
  type: Retrieval
1077
+ dataset:
 
1078
  name: MTEB DBPedia
 
 
1079
  type: mteb/dbpedia
1080
+ config: default
1081
+ split: test
1082
+ revision: c0f706b76e590d620bd6618b3ca8efdd34e2d659
1083
  metrics:
1084
  - type: main_score
1085
  value: 52.276999999999994
 
1363
  value: 17.876
1364
  - type: recall_at_5
1365
  value: 22.536
1366
+ - task:
1367
+ type: Classification
1368
+ dataset:
 
1369
  name: MTEB EmotionClassification
 
 
1370
  type: mteb/emotion
1371
+ config: default
1372
+ split: test
1373
+ revision: 4f58c6b202a23cf9a4da393831edf4f9183cad37
1374
  metrics:
1375
  - type: accuracy
1376
  value: 84.29499999999999
 
1380
  value: 84.96026012933847
1381
  - type: main_score
1382
  value: 84.29499999999999
1383
+ - task:
1384
+ type: Retrieval
1385
+ dataset:
 
1386
  name: MTEB FEVER
 
 
1387
  type: mteb/fever
1388
+ config: default
1389
+ split: test
1390
+ revision: bea83ef9e8fb933d90a2f1d5515737465d613e12
1391
  metrics:
1392
  - type: main_score
1393
  value: 94.83200000000001
 
1671
  value: 95.069
1672
  - type: recall_at_5
1673
  value: 96.177
1674
+ - task:
1675
  type: Retrieval
1676
+ dataset:
 
1677
  name: MTEB FiQA2018
 
 
1678
  type: mteb/fiqa
1679
+ config: default
1680
+ split: test
1681
+ revision: 27a168819829fe9bcd655c2df245fb19452e8e06
1682
  metrics:
1683
  - type: main_score
1684
  value: 60.480000000000004
 
1962
  value: 50.221000000000004
1963
  - type: recall_at_5
1964
  value: 58.209999999999994
1965
+ - task:
1966
  type: Retrieval
1967
+ dataset:
 
1968
  name: MTEB HotpotQA
 
 
1969
  type: mteb/hotpotqa
1970
+ config: default
1971
+ split: test
1972
+ revision: ab518f4d6fcca38d87c25209f94beba119d02014
1973
  metrics:
1974
  - type: main_score
1975
  value: 76.67399999999999
 
2253
  value: 68.879
2254
  - type: recall_at_5
2255
  value: 73.896
2256
+ - task:
2257
+ type: Classification
2258
+ dataset:
 
2259
  name: MTEB ImdbClassification
 
 
2260
  type: mteb/imdb
2261
+ config: default
2262
+ split: test
2263
+ revision: 3d86128a09e091d6018b6d26cad27f2739fc2db7
2264
  metrics:
2265
  - type: accuracy
2266
  value: 96.6608
 
2274
  value: 96.66029695623423
2275
  - type: main_score
2276
  value: 96.6608
2277
+ - task:
2278
+ type: Retrieval
2279
+ dataset:
 
2280
  name: MTEB MSMARCO
 
 
2281
  type: mteb/msmarco
2282
+ config: default
2283
+ split: dev
2284
+ revision: c5a29a104738b98a9e76336939199e264163d4a0
2285
  metrics:
2286
  - type: main_score
2287
  value: 45.217
 
2565
  value: 45.535
2566
  - type: recall_at_5
2567
  value: 55.394
2568
+ - task:
2569
+ type: Classification
2570
+ dataset:
 
2571
  name: MTEB MTOPDomainClassification (en)
 
 
2572
  type: mteb/mtop_domain
2573
+ config: en
2574
+ split: test
2575
+ revision: d80d48c1eb48d3562165c59d59d0034df9fff0bf
2576
  metrics:
2577
  - type: accuracy
2578
  value: 99.01276789785682
 
2582
  value: 99.01406884928141
2583
  - type: main_score
2584
  value: 99.01276789785682
2585
+ - task:
2586
  type: Classification
2587
+ dataset:
 
2588
  name: MTEB MTOPIntentClassification (en)
 
 
2589
  type: mteb/mtop_intent
2590
+ config: en
2591
+ split: test
2592
+ revision: ae001d0e6b1228650b7bd1c2c65fb50ad11a8aba
2593
  metrics:
2594
  - type: accuracy
2595
  value: 92.78385772913816
 
2599
  value: 93.90424147486428
2600
  - type: main_score
2601
  value: 92.78385772913816
2602
+ - task:
2603
  type: Classification
2604
+ dataset:
 
2605
  name: MTEB MassiveIntentClassification (en)
 
 
2606
  type: mteb/amazon_massive_intent
2607
+ config: en
2608
+ split: test
2609
+ revision: 4672e20407010da34463acc759c162ca9734bca6
2610
  metrics:
2611
  - type: accuracy
2612
  value: 85.83053127101546
 
2616
  value: 85.81759723866098
2617
  - type: main_score
2618
  value: 85.83053127101546
2619
+ - task:
2620
  type: Classification
2621
+ dataset:
 
2622
  name: MTEB MassiveScenarioClassification (en)
 
 
2623
  type: mteb/amazon_massive_scenario
2624
+ config: en
2625
+ split: test
2626
+ revision: fad2c6e8459f9e1c45d9315f4953d921437d70f8
2627
  metrics:
2628
  - type: accuracy
2629
  value: 90.19838601210489
 
2633
  value: 90.11422965504119
2634
  - type: main_score
2635
  value: 90.19838601210489
2636
+ - task:
2637
+ type: Clustering
2638
+ dataset:
 
2639
  name: MTEB MedrxivClusteringP2P
 
 
2640
  type: mteb/medrxiv-clustering-p2p
2641
+ config: default
2642
+ split: test
2643
+ revision: e7a26af6f3ae46b30dde8737f02c07b1505bcc73
2644
  metrics:
2645
  - type: main_score
2646
  value: 46.866746897607094
 
2648
  value: 46.866746897607094
2649
  - type: v_measure_std
2650
  value: 1.0966477896919726
2651
+ - task:
2652
  type: Clustering
2653
+ dataset:
 
2654
  name: MTEB MedrxivClusteringS2S
 
 
2655
  type: mteb/medrxiv-clustering-s2s
2656
+ config: default
2657
+ split: test
2658
+ revision: 35191c8c0dca72d8ff3efcd72aa802307d469663
2659
  metrics:
2660
  - type: main_score
2661
  value: 44.6538827415503
 
2663
  value: 44.6538827415503
2664
  - type: v_measure_std
2665
  value: 1.1649569936599116
2666
+ - task:
2667
+ type: Reranking
2668
+ dataset:
 
2669
  name: MTEB MindSmallReranking
 
 
2670
  type: mteb/mind_small
2671
+ config: default
2672
+ split: test
2673
+ revision: 59042f120c80e8afa9cdbb224f67076cec0fc9a7
2674
  metrics:
2675
  - type: main_score
2676
  value: 33.05449204940555
 
2690
  value: -15.304687384645769
2691
  - type: nAUC_mrr_std
2692
  value: -0.519919931348978
2693
+ - task:
2694
+ type: Retrieval
2695
+ dataset:
 
2696
  name: MTEB NFCorpus
 
 
2697
  type: mteb/nfcorpus
2698
+ config: default
2699
+ split: test
2700
+ revision: ec0fa4fe99da2ff19ca1214b7966684033a58814
2701
  metrics:
2702
  - type: main_score
2703
  value: 41.998000000000005
 
2981
  value: 13.267999999999999
2982
  - type: recall_at_5
2983
  value: 16.141
2984
+ - task:
2985
  type: Retrieval
2986
+ dataset:
 
2987
  name: MTEB NQ
 
 
2988
  type: mteb/nq
2989
+ config: default
2990
+ split: test
2991
+ revision: b774495ed302d8c44a3a7ea25c90dbce03968f31
2992
  metrics:
2993
  - type: main_score
2994
  value: 71.8
 
3272
  value: 74.394
3273
  - type: recall_at_5
3274
  value: 82.711
3275
+ - task:
3276
  type: Retrieval
3277
+ dataset:
 
3278
  name: MTEB QuoraRetrieval
 
 
3279
  type: mteb/quora
3280
+ config: default
3281
+ split: test
3282
+ revision: e4e08e0b7dbe3c8700f0daef558ff32256715259
3283
  metrics:
3284
  - type: main_score
3285
  value: 90.025
 
3563
  value: 89.276
3564
  - type: recall_at_5
3565
  value: 93.46
3566
+ - task:
3567
+ type: Clustering
3568
+ dataset:
 
3569
  name: MTEB RedditClustering
 
 
3570
  type: mteb/reddit-clustering
3571
+ config: default
3572
+ split: test
3573
+ revision: 24640382cdbf8abc73003fb0fa6d111a705499eb
3574
  metrics:
3575
  - type: main_score
3576
  value: 72.86492101891123
 
3578
  value: 72.86492101891123
3579
  - type: v_measure_std
3580
  value: 2.778711445144635
3581
+ - task:
3582
  type: Clustering
3583
+ dataset:
 
3584
  name: MTEB RedditClusteringP2P
 
 
3585
  type: mteb/reddit-clustering-p2p
3586
+ config: default
3587
+ split: test
3588
+ revision: 385e3cb46b4cfa89021f56c4380204149d0efe33
3589
  metrics:
3590
  - type: main_score
3591
  value: 75.27316726548479
 
3593
  value: 75.27316726548479
3594
  - type: v_measure_std
3595
  value: 8.87871936725338
3596
+ - task:
3597
+ type: Retrieval
3598
+ dataset:
 
3599
  name: MTEB SCIDOCS
 
 
3600
  type: mteb/scidocs
3601
+ config: default
3602
+ split: test
3603
+ revision: f8c2fcf00f625baaa80f62ec5bd9e1fff3b8ae88
3604
  metrics:
3605
  - type: main_score
3606
  value: 26.638
 
3884
  value: 14.127999999999998
3885
  - type: recall_at_5
3886
  value: 19.673
3887
+ - task:
3888
+ type: STS
3889
+ dataset:
 
3890
  name: MTEB SICK-R
 
 
3891
  type: mteb/sickr-sts
3892
+ config: default
3893
+ split: test
3894
+ revision: 20a6d6f312dd54037fe07a32d58e5e168867909d
3895
  metrics:
3896
  - type: cosine_pearson
3897
  value: 86.86608529160739
 
3911
  value: 86.86608529160739
3912
  - type: spearman
3913
  value: 82.88625166203383
3914
+ - task:
3915
  type: STS
3916
+ dataset:
 
3917
  name: MTEB STS12
 
 
3918
  type: mteb/sts12-sts
3919
+ config: default
3920
+ split: test
3921
+ revision: a0d554a64d88156834ff5ae9920b964011b16384
3922
  metrics:
3923
  - type: cosine_pearson
3924
  value: 87.0445014940449
 
3938
  value: 87.0445014940449
3939
  - type: spearman
3940
  value: 80.0880365116599
3941
+ - task:
3942
  type: STS
3943
+ dataset:
 
3944
  name: MTEB STS13
 
 
3945
  type: mteb/sts13-sts
3946
+ config: default
3947
+ split: test
3948
+ revision: 7e90230a92c190f1bf69ae9002b8cea547a64cca
3949
  metrics:
3950
  - type: cosine_pearson
3951
  value: 89.33900828959968
 
3965
  value: 89.33900828959968
3966
  - type: spearman
3967
  value: 89.68256358526733
3968
+ - task:
3969
  type: STS
3970
+ dataset:
 
3971
  name: MTEB STS14
 
 
3972
  type: mteb/sts14-sts
3973
+ config: default
3974
+ split: test
3975
+ revision: 6031580fec1f6af667f0bd2da0a551cf4f0b2375
3976
  metrics:
3977
  - type: cosine_pearson
3978
  value: 86.42029843639123
 
3992
  value: 86.42029843639123
3993
  - type: spearman
3994
  value: 85.0707889220723
3995
+ - task:
3996
  type: STS
3997
+ dataset:
 
3998
  name: MTEB STS15
 
 
3999
  type: mteb/sts15-sts
4000
+ config: default
4001
+ split: test
4002
+ revision: ae752c7c21bf194d8b67fd573edf7ae58183cbe3
4003
  metrics:
4004
  - type: cosine_pearson
4005
  value: 88.3660081271444
 
4019
  value: 88.3660081271444
4020
  - type: spearman
4021
  value: 89.39375083609528
4022
+ - task:
4023
  type: STS
4024
+ dataset:
 
4025
  name: MTEB STS16
 
 
4026
  type: mteb/sts16-sts
4027
+ config: default
4028
+ split: test
4029
+ revision: 4d8694f8f0e0100860b497b999b3dbed754a0513
4030
  metrics:
4031
  - type: cosine_pearson
4032
  value: 85.60708247171874
 
4046
  value: 85.60708247171874
4047
  - type: spearman
4048
  value: 87.15234952832193
4049
+ - task:
4050
  type: STS
4051
+ dataset:
 
4052
  name: MTEB STS17 (en-en)
 
 
4053
  type: mteb/sts17-crosslingual-sts
4054
+ config: en-en
4055
+ split: test
4056
+ revision: faeb762787bd10488a50c8b5be4a3b82e411949c
4057
  metrics:
4058
  - type: cosine_pearson
4059
  value: 91.25898556808458
 
4073
  value: 91.25898556808458
4074
  - type: spearman
4075
  value: 91.35372390581641
4076
+ - task:
4077
  type: STS
4078
+ dataset:
 
4079
  name: MTEB STS22 (en)
 
 
4080
  type: mteb/sts22-crosslingual-sts
4081
+ config: en
4082
+ split: test
4083
+ revision: de9d86b3b84231dc21f76c7b7af1f28e2f57f6e3
4084
  metrics:
4085
  - type: cosine_pearson
4086
  value: 67.61637111515797
 
4100
  value: 67.61637111515797
4101
  - type: spearman
4102
  value: 68.10379096526697
4103
+ - task:
4104
  type: STS
4105
+ dataset:
 
4106
  name: MTEB STSBenchmark
 
 
4107
  type: mteb/stsbenchmark-sts
4108
+ config: default
4109
+ split: test
4110
+ revision: b0fddb56ed78048fa8b90373c8a3cfc37b684831
4111
  metrics:
4112
  - type: cosine_pearson
4113
  value: 87.81592853782297
 
4127
  value: 87.81592853782297
4128
  - type: spearman
4129
  value: 88.2302550329183
4130
+ - task:
4131
+ type: Reranking
4132
+ dataset:
 
4133
  name: MTEB SciDocsRR
 
 
4134
  type: mteb/scidocs-reranking
4135
+ config: default
4136
+ split: test
4137
+ revision: d3c5e1fc0b855ab6097bf1cda04dd73947d7caab
4138
  metrics:
4139
  - type: main_score
4140
  value: 89.196009707431
 
4154
  value: 86.38341077184032
4155
  - type: nAUC_mrr_std
4156
  value: 75.38945014727746
4157
+ - task:
4158
+ type: Retrieval
4159
+ dataset:
 
4160
  name: MTEB SciFact
 
 
4161
  type: mteb/scifact
4162
+ config: default
4163
+ split: test
4164
+ revision: 0228b52cf27578f30900b9e5271d331663a030d7
4165
  metrics:
4166
  - type: main_score
4167
  value: 80.08999999999999
 
4445
  value: 80.972
4446
  - type: recall_at_5
4447
  value: 89.90599999999999
4448
+ - task:
4449
+ type: PairClassification
4450
+ dataset:
 
4451
  name: MTEB SprintDuplicateQuestions
 
 
4452
  type: mteb/sprintduplicatequestions-pairclassification
4453
+ config: default
4454
+ split: test
4455
+ revision: d66bd1f72af766a5cc4b0ca5e00c162f89e8cc46
4456
  metrics:
4457
  - type: cosine_accuracy
4458
  value: 99.81881188118813
 
4534
  value: 92.59645464025026
4535
  - type: similarity_recall
4536
  value: 88.8
4537
+ - task:
4538
+ type: Clustering
4539
+ dataset:
 
4540
  name: MTEB StackExchangeClustering
 
 
4541
  type: mteb/stackexchange-clustering
4542
+ config: default
4543
+ split: test
4544
+ revision: 6cbc1f7b2bc0622f2e39d2c77fa502909748c259
4545
  metrics:
4546
  - type: main_score
4547
  value: 80.28558559137414
 
4549
  value: 80.28558559137414
4550
  - type: v_measure_std
4551
  value: 2.795276520287584
4552
+ - task:
4553
  type: Clustering
4554
+ dataset:
 
4555
  name: MTEB StackExchangeClusteringP2P
 
 
4556
  type: mteb/stackexchange-clustering-p2p
4557
+ config: default
4558
+ split: test
4559
+ revision: 815ca46b2622cec33ccafc3735d572c266efdb44
4560
  metrics:
4561
  - type: main_score
4562
  value: 49.57135582416209
 
4564
  value: 49.57135582416209
4565
  - type: v_measure_std
4566
  value: 1.6414135468423754
4567
+ - task:
4568
+ type: Reranking
4569
+ dataset:
 
4570
  name: MTEB StackOverflowDupQuestions
 
 
4571
  type: mteb/stackoverflowdupquestions-reranking
4572
+ config: default
4573
+ split: test
4574
+ revision: e185fbe320c72810689fc5848eb6114e1ef5ec69
4575
  metrics:
4576
  - type: main_score
4577
  value: 55.253002583598644
 
4591
  value: 10.586310195339053
4592
  - type: nAUC_mrr_std
4593
  value: 8.47326494370076
4594
+ - task:
4595
+ type: Summarization
4596
+ dataset:
 
4597
  name: MTEB SummEval
 
 
4598
  type: mteb/summeval
4599
+ config: default
4600
+ split: test
4601
+ revision: cda12ad7615edc362dbf25a00fdd61d3b1eaf93c
4602
  metrics:
4603
  - type: cosine_pearson
4604
  value: 31.19874648747059
 
4614
  value: 31.19874648747059
4615
  - type: spearman
4616
  value: 31.493550648844863
4617
+ - task:
4618
+ type: Retrieval
4619
+ dataset:
 
4620
  name: MTEB TRECCOVID
 
 
4621
  type: mteb/trec-covid
4622
+ config: default
4623
+ split: test
4624
+ revision: bb9466bac8153a0349341eb1b22e06409e78ef4e
4625
  metrics:
4626
  - type: main_score
4627
  value: 85.983
 
4905
  value: 0.7250000000000001
4906
  - type: recall_at_5
4907
  value: 1.1820000000000002
4908
+ - task:
4909
  type: Retrieval
4910
+ dataset:
 
4911
  name: MTEB Touche2020
 
 
4912
  type: mteb/touche2020
4913
+ config: default
4914
+ split: test
4915
+ revision: a34f9a33db75fa0cbb21bb5cfc3dae8dc8bec93f
4916
  metrics:
4917
  - type: main_score
4918
  value: 29.944
 
5196
  value: 7.383000000000001
5197
  - type: recall_at_5
5198
  value: 11.434
5199
+ - task:
5200
+ type: Classification
5201
+ dataset:
 
5202
  name: MTEB ToxicConversationsClassification
 
 
5203
  type: mteb/toxic_conversations_50k
5204
+ config: default
5205
+ split: test
5206
+ revision: edfaf9da55d3dd50d43143d90c1ac476895ae6de
5207
  metrics:
5208
  - type: accuracy
5209
  value: 88.759765625
 
5217
  value: 90.54372649306606
5218
  - type: main_score
5219
  value: 88.759765625
5220
+ - task:
5221
  type: Classification
5222
+ dataset:
 
5223
  name: MTEB TweetSentimentExtractionClassification
 
 
5224
  type: mteb/tweet_sentiment_extraction
5225
+ config: default
5226
+ split: test
5227
+ revision: d604517c81ca91fe16a244d1248fc021f9ecee7a
5228
  metrics:
5229
  - type: accuracy
5230
  value: 74.8443689869836
 
5234
  value: 74.7369003946243
5235
  - type: main_score
5236
  value: 74.8443689869836
5237
+ - task:
5238
+ type: Clustering
5239
+ dataset:
 
5240
  name: MTEB TwentyNewsgroupsClustering
 
 
5241
  type: mteb/twentynewsgroups-clustering
5242
+ config: default
5243
+ split: test
5244
+ revision: 6125ec4e24fa026cec8a478383ee943acfbd5449
5245
  metrics:
5246
  - type: main_score
5247
  value: 61.42918790942448
 
5249
  value: 61.42918790942448
5250
  - type: v_measure_std
5251
  value: 1.0156550098843082
5252
+ - task:
5253
+ type: PairClassification
5254
+ dataset:
 
5255
  name: MTEB TwitterSemEval2015
 
 
5256
  type: mteb/twittersemeval2015-pairclassification
5257
+ config: default
5258
+ split: test
5259
+ revision: 70970daeab8776df92f5ea462b6173c0b46fd2d1
5260
  metrics:
5261
  - type: cosine_accuracy
5262
  value: 88.22197055492639
 
5338
  value: 71.64922770303936
5339
  - type: similarity_recall
5340
  value: 75.8839050131926
5341
+ - task:
5342
  type: PairClassification
5343
+ dataset:
 
5344
  name: MTEB TwitterURLCorpus
 
 
5345
  type: mteb/twitterurlcorpus-pairclassification
5346
+ config: default
5347
+ split: test
5348
+ revision: 8b6510b0b1fa4e4c4f879467980e9be563ec1cdf
5349
  metrics:
5350
  - type: cosine_accuracy
5351
  value: 89.88628866379477
 
5427
  value: 76.93126197063205
5428
  - type: similarity_recall
5429
  value: 83.50015398829689
 
 
 
 
 
 
 
 
5430
  ---
5431
 
5432
 
onnx/added_tokens.json ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ {
2
+ "<|endoftext|>": 151643,
3
+ "<|im_end|>": 151645,
4
+ "<|im_start|>": 151644
5
+ }
onnx/config.json ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_attn_implementation_autoset": true,
3
+ "architectures": [
4
+ "Qwen2ForCausalLM"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "auto_map": {
8
+ "AutoModel": "NovaSearch/stella_en_1.5B_v5--modeling_qwen.Qwen2Model",
9
+ "AutoModelForCausalLM": "NovaSearch/stella_en_1.5B_v5--modeling_qwen.Qwen2ForCausalLM",
10
+ "AutoModelForSequenceClassification": "NovaSearch/stella_en_1.5B_v5--modeling_qwen.Qwen2ForSequenceClassification"
11
+ },
12
+ "bos_token_id": 151643,
13
+ "eos_token_id": 151643,
14
+ "export_model_type": "transformer",
15
+ "hidden_act": "silu",
16
+ "hidden_size": 1536,
17
+ "initializer_range": 0.02,
18
+ "intermediate_size": 8960,
19
+ "max_position_embeddings": 131072,
20
+ "max_window_layers": 21,
21
+ "model_type": "qwen2",
22
+ "num_attention_heads": 12,
23
+ "num_hidden_layers": 28,
24
+ "num_key_value_heads": 2,
25
+ "rms_norm_eps": 1e-06,
26
+ "rope_scaling": null,
27
+ "rope_theta": 1000000.0,
28
+ "sliding_window": 131072,
29
+ "tie_word_embeddings": false,
30
+ "torch_dtype": "float32",
31
+ "transformers_version": "4.51.3",
32
+ "use_cache": true,
33
+ "use_sliding_window": false,
34
+ "vocab_size": 151646
35
+ }
onnx/merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
onnx/model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8b8d12c8210ae19b00bbdca6ddfe3d70da0d46312c72bcfa1fd6e3707cfdd7d2
3
- size 874851
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b44c618d7f278c8b171a78c6635b844caa144556b46d144ecaaac8562f6f927
3
+ size 1430611
onnx/model.onnx_data CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4d9d0ac35b704186bd6bf7d969ebccc7929e0cb13acae9f088a061e433141f29
3
- size 6313588736
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b96b4485d9715a6efb678336ed8069976eca6d7b85f05188f3142ffb0561f667
3
+ size 6179371008
onnx/special_tokens_map.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<|im_start|>",
4
+ "<|im_end|>"
5
+ ],
6
+ "eos_token": {
7
+ "content": "<|endoftext|>",
8
+ "lstrip": false,
9
+ "normalized": false,
10
+ "rstrip": false,
11
+ "single_word": false
12
+ },
13
+ "pad_token": {
14
+ "content": "<|endoftext|>",
15
+ "lstrip": false,
16
+ "normalized": false,
17
+ "rstrip": false,
18
+ "single_word": false
19
+ }
20
+ }
onnx/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8372feaa064372d176aff57e8f1e64f194814bb074519104f64c66a2825f091
3
+ size 11419037
onnx/tokenizer_config.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_eos_token": true,
3
+ "add_prefix_space": false,
4
+ "added_tokens_decoder": {
5
+ "151643": {
6
+ "content": "<|endoftext|>",
7
+ "lstrip": false,
8
+ "normalized": false,
9
+ "rstrip": false,
10
+ "single_word": false,
11
+ "special": true
12
+ },
13
+ "151644": {
14
+ "content": "<|im_start|>",
15
+ "lstrip": false,
16
+ "normalized": false,
17
+ "rstrip": false,
18
+ "single_word": false,
19
+ "special": true
20
+ },
21
+ "151645": {
22
+ "content": "<|im_end|>",
23
+ "lstrip": false,
24
+ "normalized": false,
25
+ "rstrip": false,
26
+ "single_word": false,
27
+ "special": true
28
+ }
29
+ },
30
+ "additional_special_tokens": [
31
+ "<|im_start|>",
32
+ "<|im_end|>"
33
+ ],
34
+ "auto_map": {
35
+ "AutoTokenizer": [
36
+ "NovaSearch/stella_en_1.5B_v5--tokenization_qwen.Qwen2Tokenizer",
37
+ "NovaSearch/stella_en_1.5B_v5--tokenization_qwen.Qwen2TokenizerFast"
38
+ ]
39
+ },
40
+ "bos_token": null,
41
+ "chat_template": "{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
42
+ "clean_up_tokenization_spaces": false,
43
+ "eos_token": "<|endoftext|>",
44
+ "errors": "replace",
45
+ "extra_special_tokens": {},
46
+ "model_max_length": 32768,
47
+ "pad_token": "<|endoftext|>",
48
+ "split_special_tokens": false,
49
+ "tokenizer_class": "Qwen2Tokenizer",
50
+ "unk_token": null
51
+ }
onnx/vocab.json ADDED
The diff for this file is too large to render. See raw diff