Adding ONNX file of this model

#48
by abukhoyer - opened
.gitattributes CHANGED
@@ -35,3 +35,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  onnx/model.onnx_data filter=lfs diff=lfs merge=lfs -text
37
  onnx/model_fp16.onnx_data filter=lfs diff=lfs merge=lfs -text
 
 
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  onnx/model.onnx_data filter=lfs diff=lfs merge=lfs -text
37
  onnx/model_fp16.onnx_data filter=lfs diff=lfs merge=lfs -text
38
+ onnx/tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md CHANGED
@@ -1,13 +1,22 @@
1
  ---
 
 
 
 
 
 
 
2
  model-index:
3
  - name: stella_en_1.5B_v5
4
  results:
5
- - dataset:
6
- config: en
 
7
  name: MTEB AmazonCounterfactualClassification (en)
8
- revision: e8379541af4e31359cca9fbcf4b00f2671dba205
9
- split: test
10
  type: mteb/amazon_counterfactual
 
 
 
11
  metrics:
12
  - type: accuracy
13
  value: 92.86567164179104
@@ -21,14 +30,14 @@ model-index:
21
  value: 93.13621183004571
22
  - type: main_score
23
  value: 92.86567164179104
24
- task:
25
  type: Classification
26
- - dataset:
27
- config: default
28
  name: MTEB AmazonPolarityClassification
29
- revision: e2d317d38cd51312af73b3d32a06d1a08b442046
30
- split: test
31
  type: mteb/amazon_polarity
 
 
 
32
  metrics:
33
  - type: accuracy
34
  value: 97.16485
@@ -42,14 +51,14 @@ model-index:
42
  value: 97.16351087403213
43
  - type: main_score
44
  value: 97.16485
45
- task:
46
  type: Classification
47
- - dataset:
48
- config: en
49
  name: MTEB AmazonReviewsClassification (en)
50
- revision: 1399c76144fd37290681b995c656ef9b2e06e26d
51
- split: test
52
  type: mteb/amazon_reviews_multi
 
 
 
53
  metrics:
54
  - type: accuracy
55
  value: 59.358
@@ -59,14 +68,14 @@ model-index:
59
  value: 59.0264615883114
60
  - type: main_score
61
  value: 59.358
62
- task:
63
- type: Classification
64
- - dataset:
65
- config: default
66
  name: MTEB ArguAna
67
- revision: c22ab2a51041ffd869aaddef7af8d8215647e41a
68
- split: test
69
  type: mteb/arguana
 
 
 
70
  metrics:
71
  - type: main_score
72
  value: 65.269
@@ -350,14 +359,14 @@ model-index:
350
  value: 67.354
351
  - type: recall_at_5
352
  value: 78.236
353
- task:
354
- type: Retrieval
355
- - dataset:
356
- config: default
357
  name: MTEB ArxivClusteringP2P
358
- revision: a122ad7f3f0291bf49cc6f4d32aa80929df69d5d
359
- split: test
360
  type: mteb/arxiv-clustering-p2p
 
 
 
361
  metrics:
362
  - type: main_score
363
  value: 55.437138353189994
@@ -365,14 +374,14 @@ model-index:
365
  value: 55.437138353189994
366
  - type: v_measure_std
367
  value: 14.718556601335491
368
- task:
369
  type: Clustering
370
- - dataset:
371
- config: default
372
  name: MTEB ArxivClusteringS2S
373
- revision: f910caf1a6075f7329cdf8c1a6135696f37dbd53
374
- split: test
375
  type: mteb/arxiv-clustering-s2s
 
 
 
376
  metrics:
377
  - type: main_score
378
  value: 50.65858459544658
@@ -380,14 +389,14 @@ model-index:
380
  value: 50.65858459544658
381
  - type: v_measure_std
382
  value: 14.887033747525146
383
- task:
384
- type: Clustering
385
- - dataset:
386
- config: default
387
  name: MTEB AskUbuntuDupQuestions
388
- revision: 2000358ca161889fa9c082cb41daa8dcfb161a54
389
- split: test
390
  type: mteb/askubuntudupquestions-reranking
 
 
 
391
  metrics:
392
  - type: main_score
393
  value: 67.32597152838535
@@ -407,14 +416,14 @@ model-index:
407
  value: 41.64561939958336
408
  - type: nAUC_mrr_std
409
  value: 23.179909345891968
410
- task:
411
- type: Reranking
412
- - dataset:
413
- config: default
414
  name: MTEB BIOSSES
415
- revision: d3fb88f8f02e40887cd149695127462bbcf29b4a
416
- split: test
417
  type: mteb/biosses-sts
 
 
 
418
  metrics:
419
  - type: cosine_pearson
420
  value: 85.790820496042
@@ -434,14 +443,14 @@ model-index:
434
  value: 85.790820496042
435
  - type: spearman
436
  value: 83.10731534330517
437
- task:
438
- type: STS
439
- - dataset:
440
- config: default
441
  name: MTEB Banking77Classification
442
- revision: 0fd18e25b25c072e09e0d92ab615fda904d66300
443
- split: test
444
  type: mteb/banking77
 
 
 
445
  metrics:
446
  - type: accuracy
447
  value: 89.78896103896105
@@ -451,14 +460,14 @@ model-index:
451
  value: 89.76107366333488
452
  - type: main_score
453
  value: 89.78896103896105
454
- task:
455
- type: Classification
456
- - dataset:
457
- config: default
458
  name: MTEB BiorxivClusteringP2P
459
- revision: 65b79d1d13f80053f67aca9498d9402c2d9f1f40
460
- split: test
461
  type: mteb/biorxiv-clustering-p2p
 
 
 
462
  metrics:
463
  - type: main_score
464
  value: 50.68092296236376
@@ -466,14 +475,14 @@ model-index:
466
  value: 50.68092296236376
467
  - type: v_measure_std
468
  value: 0.7832640983085436
469
- task:
470
  type: Clustering
471
- - dataset:
472
- config: default
473
  name: MTEB BiorxivClusteringS2S
474
- revision: 258694dd0231531bc1fd9de6ceb52a0853c6d908
475
- split: test
476
  type: mteb/biorxiv-clustering-s2s
 
 
 
477
  metrics:
478
  - type: main_score
479
  value: 46.86629236732983
@@ -481,14 +490,14 @@ model-index:
481
  value: 46.86629236732983
482
  - type: v_measure_std
483
  value: 0.8784322236350974
484
- task:
485
- type: Clustering
486
- - dataset:
487
- config: default
488
  name: MTEB CQADupstackRetrieval
489
- revision: 4ffe81d471b1924886b33c7567bfb200e9eec5c4
490
- split: test
491
  type: mteb/cqadupstack
 
 
 
492
  metrics:
493
  - type: main_score
494
  value: 47.74883333333334
@@ -772,14 +781,14 @@ model-index:
772
  value: 46.01841666666666
773
  - type: recall_at_5
774
  value: 52.482416666666666
775
- task:
776
  type: Retrieval
777
- - dataset:
778
- config: default
779
  name: MTEB ClimateFEVER
780
- revision: 47f2ac6acb640fc46020b02a5b59fdda04d39380
781
- split: test
782
  type: mteb/climate-fever
 
 
 
783
  metrics:
784
  - type: main_score
785
  value: 46.113
@@ -1063,14 +1072,14 @@ model-index:
1063
  value: 35.150999999999996
1064
  - type: recall_at_5
1065
  value: 42.748000000000005
1066
- task:
1067
  type: Retrieval
1068
- - dataset:
1069
- config: default
1070
  name: MTEB DBPedia
1071
- revision: c0f706b76e590d620bd6618b3ca8efdd34e2d659
1072
- split: test
1073
  type: mteb/dbpedia
 
 
 
1074
  metrics:
1075
  - type: main_score
1076
  value: 52.276999999999994
@@ -1354,14 +1363,14 @@ model-index:
1354
  value: 17.876
1355
  - type: recall_at_5
1356
  value: 22.536
1357
- task:
1358
- type: Retrieval
1359
- - dataset:
1360
- config: default
1361
  name: MTEB EmotionClassification
1362
- revision: 4f58c6b202a23cf9a4da393831edf4f9183cad37
1363
- split: test
1364
  type: mteb/emotion
 
 
 
1365
  metrics:
1366
  - type: accuracy
1367
  value: 84.29499999999999
@@ -1371,14 +1380,14 @@ model-index:
1371
  value: 84.96026012933847
1372
  - type: main_score
1373
  value: 84.29499999999999
1374
- task:
1375
- type: Classification
1376
- - dataset:
1377
- config: default
1378
  name: MTEB FEVER
1379
- revision: bea83ef9e8fb933d90a2f1d5515737465d613e12
1380
- split: test
1381
  type: mteb/fever
 
 
 
1382
  metrics:
1383
  - type: main_score
1384
  value: 94.83200000000001
@@ -1662,14 +1671,14 @@ model-index:
1662
  value: 95.069
1663
  - type: recall_at_5
1664
  value: 96.177
1665
- task:
1666
  type: Retrieval
1667
- - dataset:
1668
- config: default
1669
  name: MTEB FiQA2018
1670
- revision: 27a168819829fe9bcd655c2df245fb19452e8e06
1671
- split: test
1672
  type: mteb/fiqa
 
 
 
1673
  metrics:
1674
  - type: main_score
1675
  value: 60.480000000000004
@@ -1953,14 +1962,14 @@ model-index:
1953
  value: 50.221000000000004
1954
  - type: recall_at_5
1955
  value: 58.209999999999994
1956
- task:
1957
  type: Retrieval
1958
- - dataset:
1959
- config: default
1960
  name: MTEB HotpotQA
1961
- revision: ab518f4d6fcca38d87c25209f94beba119d02014
1962
- split: test
1963
  type: mteb/hotpotqa
 
 
 
1964
  metrics:
1965
  - type: main_score
1966
  value: 76.67399999999999
@@ -2244,14 +2253,14 @@ model-index:
2244
  value: 68.879
2245
  - type: recall_at_5
2246
  value: 73.896
2247
- task:
2248
- type: Retrieval
2249
- - dataset:
2250
- config: default
2251
  name: MTEB ImdbClassification
2252
- revision: 3d86128a09e091d6018b6d26cad27f2739fc2db7
2253
- split: test
2254
  type: mteb/imdb
 
 
 
2255
  metrics:
2256
  - type: accuracy
2257
  value: 96.6608
@@ -2265,14 +2274,14 @@ model-index:
2265
  value: 96.66029695623423
2266
  - type: main_score
2267
  value: 96.6608
2268
- task:
2269
- type: Classification
2270
- - dataset:
2271
- config: default
2272
  name: MTEB MSMARCO
2273
- revision: c5a29a104738b98a9e76336939199e264163d4a0
2274
- split: dev
2275
  type: mteb/msmarco
 
 
 
2276
  metrics:
2277
  - type: main_score
2278
  value: 45.217
@@ -2556,14 +2565,14 @@ model-index:
2556
  value: 45.535
2557
  - type: recall_at_5
2558
  value: 55.394
2559
- task:
2560
- type: Retrieval
2561
- - dataset:
2562
- config: en
2563
  name: MTEB MTOPDomainClassification (en)
2564
- revision: d80d48c1eb48d3562165c59d59d0034df9fff0bf
2565
- split: test
2566
  type: mteb/mtop_domain
 
 
 
2567
  metrics:
2568
  - type: accuracy
2569
  value: 99.01276789785682
@@ -2573,14 +2582,14 @@ model-index:
2573
  value: 99.01406884928141
2574
  - type: main_score
2575
  value: 99.01276789785682
2576
- task:
2577
  type: Classification
2578
- - dataset:
2579
- config: en
2580
  name: MTEB MTOPIntentClassification (en)
2581
- revision: ae001d0e6b1228650b7bd1c2c65fb50ad11a8aba
2582
- split: test
2583
  type: mteb/mtop_intent
 
 
 
2584
  metrics:
2585
  - type: accuracy
2586
  value: 92.78385772913816
@@ -2590,14 +2599,14 @@ model-index:
2590
  value: 93.90424147486428
2591
  - type: main_score
2592
  value: 92.78385772913816
2593
- task:
2594
  type: Classification
2595
- - dataset:
2596
- config: en
2597
  name: MTEB MassiveIntentClassification (en)
2598
- revision: 4672e20407010da34463acc759c162ca9734bca6
2599
- split: test
2600
  type: mteb/amazon_massive_intent
 
 
 
2601
  metrics:
2602
  - type: accuracy
2603
  value: 85.83053127101546
@@ -2607,14 +2616,14 @@ model-index:
2607
  value: 85.81759723866098
2608
  - type: main_score
2609
  value: 85.83053127101546
2610
- task:
2611
  type: Classification
2612
- - dataset:
2613
- config: en
2614
  name: MTEB MassiveScenarioClassification (en)
2615
- revision: fad2c6e8459f9e1c45d9315f4953d921437d70f8
2616
- split: test
2617
  type: mteb/amazon_massive_scenario
 
 
 
2618
  metrics:
2619
  - type: accuracy
2620
  value: 90.19838601210489
@@ -2624,14 +2633,14 @@ model-index:
2624
  value: 90.11422965504119
2625
  - type: main_score
2626
  value: 90.19838601210489
2627
- task:
2628
- type: Classification
2629
- - dataset:
2630
- config: default
2631
  name: MTEB MedrxivClusteringP2P
2632
- revision: e7a26af6f3ae46b30dde8737f02c07b1505bcc73
2633
- split: test
2634
  type: mteb/medrxiv-clustering-p2p
 
 
 
2635
  metrics:
2636
  - type: main_score
2637
  value: 46.866746897607094
@@ -2639,14 +2648,14 @@ model-index:
2639
  value: 46.866746897607094
2640
  - type: v_measure_std
2641
  value: 1.0966477896919726
2642
- task:
2643
  type: Clustering
2644
- - dataset:
2645
- config: default
2646
  name: MTEB MedrxivClusteringS2S
2647
- revision: 35191c8c0dca72d8ff3efcd72aa802307d469663
2648
- split: test
2649
  type: mteb/medrxiv-clustering-s2s
 
 
 
2650
  metrics:
2651
  - type: main_score
2652
  value: 44.6538827415503
@@ -2654,14 +2663,14 @@ model-index:
2654
  value: 44.6538827415503
2655
  - type: v_measure_std
2656
  value: 1.1649569936599116
2657
- task:
2658
- type: Clustering
2659
- - dataset:
2660
- config: default
2661
  name: MTEB MindSmallReranking
2662
- revision: 59042f120c80e8afa9cdbb224f67076cec0fc9a7
2663
- split: test
2664
  type: mteb/mind_small
 
 
 
2665
  metrics:
2666
  - type: main_score
2667
  value: 33.05449204940555
@@ -2681,14 +2690,14 @@ model-index:
2681
  value: -15.304687384645769
2682
  - type: nAUC_mrr_std
2683
  value: -0.519919931348978
2684
- task:
2685
- type: Reranking
2686
- - dataset:
2687
- config: default
2688
  name: MTEB NFCorpus
2689
- revision: ec0fa4fe99da2ff19ca1214b7966684033a58814
2690
- split: test
2691
  type: mteb/nfcorpus
 
 
 
2692
  metrics:
2693
  - type: main_score
2694
  value: 41.998000000000005
@@ -2972,14 +2981,14 @@ model-index:
2972
  value: 13.267999999999999
2973
  - type: recall_at_5
2974
  value: 16.141
2975
- task:
2976
  type: Retrieval
2977
- - dataset:
2978
- config: default
2979
  name: MTEB NQ
2980
- revision: b774495ed302d8c44a3a7ea25c90dbce03968f31
2981
- split: test
2982
  type: mteb/nq
 
 
 
2983
  metrics:
2984
  - type: main_score
2985
  value: 71.8
@@ -3263,14 +3272,14 @@ model-index:
3263
  value: 74.394
3264
  - type: recall_at_5
3265
  value: 82.711
3266
- task:
3267
  type: Retrieval
3268
- - dataset:
3269
- config: default
3270
  name: MTEB QuoraRetrieval
3271
- revision: e4e08e0b7dbe3c8700f0daef558ff32256715259
3272
- split: test
3273
  type: mteb/quora
 
 
 
3274
  metrics:
3275
  - type: main_score
3276
  value: 90.025
@@ -3554,14 +3563,14 @@ model-index:
3554
  value: 89.276
3555
  - type: recall_at_5
3556
  value: 93.46
3557
- task:
3558
- type: Retrieval
3559
- - dataset:
3560
- config: default
3561
  name: MTEB RedditClustering
3562
- revision: 24640382cdbf8abc73003fb0fa6d111a705499eb
3563
- split: test
3564
  type: mteb/reddit-clustering
 
 
 
3565
  metrics:
3566
  - type: main_score
3567
  value: 72.86492101891123
@@ -3569,14 +3578,14 @@ model-index:
3569
  value: 72.86492101891123
3570
  - type: v_measure_std
3571
  value: 2.778711445144635
3572
- task:
3573
  type: Clustering
3574
- - dataset:
3575
- config: default
3576
  name: MTEB RedditClusteringP2P
3577
- revision: 385e3cb46b4cfa89021f56c4380204149d0efe33
3578
- split: test
3579
  type: mteb/reddit-clustering-p2p
 
 
 
3580
  metrics:
3581
  - type: main_score
3582
  value: 75.27316726548479
@@ -3584,14 +3593,14 @@ model-index:
3584
  value: 75.27316726548479
3585
  - type: v_measure_std
3586
  value: 8.87871936725338
3587
- task:
3588
- type: Clustering
3589
- - dataset:
3590
- config: default
3591
  name: MTEB SCIDOCS
3592
- revision: f8c2fcf00f625baaa80f62ec5bd9e1fff3b8ae88
3593
- split: test
3594
  type: mteb/scidocs
 
 
 
3595
  metrics:
3596
  - type: main_score
3597
  value: 26.638
@@ -3875,14 +3884,14 @@ model-index:
3875
  value: 14.127999999999998
3876
  - type: recall_at_5
3877
  value: 19.673
3878
- task:
3879
- type: Retrieval
3880
- - dataset:
3881
- config: default
3882
  name: MTEB SICK-R
3883
- revision: 20a6d6f312dd54037fe07a32d58e5e168867909d
3884
- split: test
3885
  type: mteb/sickr-sts
 
 
 
3886
  metrics:
3887
  - type: cosine_pearson
3888
  value: 86.86608529160739
@@ -3902,14 +3911,14 @@ model-index:
3902
  value: 86.86608529160739
3903
  - type: spearman
3904
  value: 82.88625166203383
3905
- task:
3906
  type: STS
3907
- - dataset:
3908
- config: default
3909
  name: MTEB STS12
3910
- revision: a0d554a64d88156834ff5ae9920b964011b16384
3911
- split: test
3912
  type: mteb/sts12-sts
 
 
 
3913
  metrics:
3914
  - type: cosine_pearson
3915
  value: 87.0445014940449
@@ -3929,14 +3938,14 @@ model-index:
3929
  value: 87.0445014940449
3930
  - type: spearman
3931
  value: 80.0880365116599
3932
- task:
3933
  type: STS
3934
- - dataset:
3935
- config: default
3936
  name: MTEB STS13
3937
- revision: 7e90230a92c190f1bf69ae9002b8cea547a64cca
3938
- split: test
3939
  type: mteb/sts13-sts
 
 
 
3940
  metrics:
3941
  - type: cosine_pearson
3942
  value: 89.33900828959968
@@ -3956,14 +3965,14 @@ model-index:
3956
  value: 89.33900828959968
3957
  - type: spearman
3958
  value: 89.68256358526733
3959
- task:
3960
  type: STS
3961
- - dataset:
3962
- config: default
3963
  name: MTEB STS14
3964
- revision: 6031580fec1f6af667f0bd2da0a551cf4f0b2375
3965
- split: test
3966
  type: mteb/sts14-sts
 
 
 
3967
  metrics:
3968
  - type: cosine_pearson
3969
  value: 86.42029843639123
@@ -3983,14 +3992,14 @@ model-index:
3983
  value: 86.42029843639123
3984
  - type: spearman
3985
  value: 85.0707889220723
3986
- task:
3987
  type: STS
3988
- - dataset:
3989
- config: default
3990
  name: MTEB STS15
3991
- revision: ae752c7c21bf194d8b67fd573edf7ae58183cbe3
3992
- split: test
3993
  type: mteb/sts15-sts
 
 
 
3994
  metrics:
3995
  - type: cosine_pearson
3996
  value: 88.3660081271444
@@ -4010,14 +4019,14 @@ model-index:
4010
  value: 88.3660081271444
4011
  - type: spearman
4012
  value: 89.39375083609528
4013
- task:
4014
  type: STS
4015
- - dataset:
4016
- config: default
4017
  name: MTEB STS16
4018
- revision: 4d8694f8f0e0100860b497b999b3dbed754a0513
4019
- split: test
4020
  type: mteb/sts16-sts
 
 
 
4021
  metrics:
4022
  - type: cosine_pearson
4023
  value: 85.60708247171874
@@ -4037,14 +4046,14 @@ model-index:
4037
  value: 85.60708247171874
4038
  - type: spearman
4039
  value: 87.15234952832193
4040
- task:
4041
  type: STS
4042
- - dataset:
4043
- config: en-en
4044
  name: MTEB STS17 (en-en)
4045
- revision: faeb762787bd10488a50c8b5be4a3b82e411949c
4046
- split: test
4047
  type: mteb/sts17-crosslingual-sts
 
 
 
4048
  metrics:
4049
  - type: cosine_pearson
4050
  value: 91.25898556808458
@@ -4064,14 +4073,14 @@ model-index:
4064
  value: 91.25898556808458
4065
  - type: spearman
4066
  value: 91.35372390581641
4067
- task:
4068
  type: STS
4069
- - dataset:
4070
- config: en
4071
  name: MTEB STS22 (en)
4072
- revision: de9d86b3b84231dc21f76c7b7af1f28e2f57f6e3
4073
- split: test
4074
  type: mteb/sts22-crosslingual-sts
 
 
 
4075
  metrics:
4076
  - type: cosine_pearson
4077
  value: 67.61637111515797
@@ -4091,14 +4100,14 @@ model-index:
4091
  value: 67.61637111515797
4092
  - type: spearman
4093
  value: 68.10379096526697
4094
- task:
4095
  type: STS
4096
- - dataset:
4097
- config: default
4098
  name: MTEB STSBenchmark
4099
- revision: b0fddb56ed78048fa8b90373c8a3cfc37b684831
4100
- split: test
4101
  type: mteb/stsbenchmark-sts
 
 
 
4102
  metrics:
4103
  - type: cosine_pearson
4104
  value: 87.81592853782297
@@ -4118,14 +4127,14 @@ model-index:
4118
  value: 87.81592853782297
4119
  - type: spearman
4120
  value: 88.2302550329183
4121
- task:
4122
- type: STS
4123
- - dataset:
4124
- config: default
4125
  name: MTEB SciDocsRR
4126
- revision: d3c5e1fc0b855ab6097bf1cda04dd73947d7caab
4127
- split: test
4128
  type: mteb/scidocs-reranking
 
 
 
4129
  metrics:
4130
  - type: main_score
4131
  value: 89.196009707431
@@ -4145,14 +4154,14 @@ model-index:
4145
  value: 86.38341077184032
4146
  - type: nAUC_mrr_std
4147
  value: 75.38945014727746
4148
- task:
4149
- type: Reranking
4150
- - dataset:
4151
- config: default
4152
  name: MTEB SciFact
4153
- revision: 0228b52cf27578f30900b9e5271d331663a030d7
4154
- split: test
4155
  type: mteb/scifact
 
 
 
4156
  metrics:
4157
  - type: main_score
4158
  value: 80.08999999999999
@@ -4436,14 +4445,14 @@ model-index:
4436
  value: 80.972
4437
  - type: recall_at_5
4438
  value: 89.90599999999999
4439
- task:
4440
- type: Retrieval
4441
- - dataset:
4442
- config: default
4443
  name: MTEB SprintDuplicateQuestions
4444
- revision: d66bd1f72af766a5cc4b0ca5e00c162f89e8cc46
4445
- split: test
4446
  type: mteb/sprintduplicatequestions-pairclassification
 
 
 
4447
  metrics:
4448
  - type: cosine_accuracy
4449
  value: 99.81881188118813
@@ -4525,14 +4534,14 @@ model-index:
4525
  value: 92.59645464025026
4526
  - type: similarity_recall
4527
  value: 88.8
4528
- task:
4529
- type: PairClassification
4530
- - dataset:
4531
- config: default
4532
  name: MTEB StackExchangeClustering
4533
- revision: 6cbc1f7b2bc0622f2e39d2c77fa502909748c259
4534
- split: test
4535
  type: mteb/stackexchange-clustering
 
 
 
4536
  metrics:
4537
  - type: main_score
4538
  value: 80.28558559137414
@@ -4540,14 +4549,14 @@ model-index:
4540
  value: 80.28558559137414
4541
  - type: v_measure_std
4542
  value: 2.795276520287584
4543
- task:
4544
  type: Clustering
4545
- - dataset:
4546
- config: default
4547
  name: MTEB StackExchangeClusteringP2P
4548
- revision: 815ca46b2622cec33ccafc3735d572c266efdb44
4549
- split: test
4550
  type: mteb/stackexchange-clustering-p2p
 
 
 
4551
  metrics:
4552
  - type: main_score
4553
  value: 49.57135582416209
@@ -4555,14 +4564,14 @@ model-index:
4555
  value: 49.57135582416209
4556
  - type: v_measure_std
4557
  value: 1.6414135468423754
4558
- task:
4559
- type: Clustering
4560
- - dataset:
4561
- config: default
4562
  name: MTEB StackOverflowDupQuestions
4563
- revision: e185fbe320c72810689fc5848eb6114e1ef5ec69
4564
- split: test
4565
  type: mteb/stackoverflowdupquestions-reranking
 
 
 
4566
  metrics:
4567
  - type: main_score
4568
  value: 55.253002583598644
@@ -4582,14 +4591,14 @@ model-index:
4582
  value: 10.586310195339053
4583
  - type: nAUC_mrr_std
4584
  value: 8.47326494370076
4585
- task:
4586
- type: Reranking
4587
- - dataset:
4588
- config: default
4589
  name: MTEB SummEval
4590
- revision: cda12ad7615edc362dbf25a00fdd61d3b1eaf93c
4591
- split: test
4592
  type: mteb/summeval
 
 
 
4593
  metrics:
4594
  - type: cosine_pearson
4595
  value: 31.19874648747059
@@ -4605,14 +4614,14 @@ model-index:
4605
  value: 31.19874648747059
4606
  - type: spearman
4607
  value: 31.493550648844863
4608
- task:
4609
- type: Summarization
4610
- - dataset:
4611
- config: default
4612
  name: MTEB TRECCOVID
4613
- revision: bb9466bac8153a0349341eb1b22e06409e78ef4e
4614
- split: test
4615
  type: mteb/trec-covid
 
 
 
4616
  metrics:
4617
  - type: main_score
4618
  value: 85.983
@@ -4896,14 +4905,14 @@ model-index:
4896
  value: 0.7250000000000001
4897
  - type: recall_at_5
4898
  value: 1.1820000000000002
4899
- task:
4900
  type: Retrieval
4901
- - dataset:
4902
- config: default
4903
  name: MTEB Touche2020
4904
- revision: a34f9a33db75fa0cbb21bb5cfc3dae8dc8bec93f
4905
- split: test
4906
  type: mteb/touche2020
 
 
 
4907
  metrics:
4908
  - type: main_score
4909
  value: 29.944
@@ -5187,14 +5196,14 @@ model-index:
5187
  value: 7.383000000000001
5188
  - type: recall_at_5
5189
  value: 11.434
5190
- task:
5191
- type: Retrieval
5192
- - dataset:
5193
- config: default
5194
  name: MTEB ToxicConversationsClassification
5195
- revision: edfaf9da55d3dd50d43143d90c1ac476895ae6de
5196
- split: test
5197
  type: mteb/toxic_conversations_50k
 
 
 
5198
  metrics:
5199
  - type: accuracy
5200
  value: 88.759765625
@@ -5208,14 +5217,14 @@ model-index:
5208
  value: 90.54372649306606
5209
  - type: main_score
5210
  value: 88.759765625
5211
- task:
5212
  type: Classification
5213
- - dataset:
5214
- config: default
5215
  name: MTEB TweetSentimentExtractionClassification
5216
- revision: d604517c81ca91fe16a244d1248fc021f9ecee7a
5217
- split: test
5218
  type: mteb/tweet_sentiment_extraction
 
 
 
5219
  metrics:
5220
  - type: accuracy
5221
  value: 74.8443689869836
@@ -5225,14 +5234,14 @@ model-index:
5225
  value: 74.7369003946243
5226
  - type: main_score
5227
  value: 74.8443689869836
5228
- task:
5229
- type: Classification
5230
- - dataset:
5231
- config: default
5232
  name: MTEB TwentyNewsgroupsClustering
5233
- revision: 6125ec4e24fa026cec8a478383ee943acfbd5449
5234
- split: test
5235
  type: mteb/twentynewsgroups-clustering
 
 
 
5236
  metrics:
5237
  - type: main_score
5238
  value: 61.42918790942448
@@ -5240,14 +5249,14 @@ model-index:
5240
  value: 61.42918790942448
5241
  - type: v_measure_std
5242
  value: 1.0156550098843082
5243
- task:
5244
- type: Clustering
5245
- - dataset:
5246
- config: default
5247
  name: MTEB TwitterSemEval2015
5248
- revision: 70970daeab8776df92f5ea462b6173c0b46fd2d1
5249
- split: test
5250
  type: mteb/twittersemeval2015-pairclassification
 
 
 
5251
  metrics:
5252
  - type: cosine_accuracy
5253
  value: 88.22197055492639
@@ -5329,14 +5338,14 @@ model-index:
5329
  value: 71.64922770303936
5330
  - type: similarity_recall
5331
  value: 75.8839050131926
5332
- task:
5333
  type: PairClassification
5334
- - dataset:
5335
- config: default
5336
  name: MTEB TwitterURLCorpus
5337
- revision: 8b6510b0b1fa4e4c4f879467980e9be563ec1cdf
5338
- split: test
5339
  type: mteb/twitterurlcorpus-pairclassification
 
 
 
5340
  metrics:
5341
  - type: cosine_accuracy
5342
  value: 89.88628866379477
@@ -5418,14 +5427,6 @@ model-index:
5418
  value: 76.93126197063205
5419
  - type: similarity_recall
5420
  value: 83.50015398829689
5421
- task:
5422
- type: PairClassification
5423
- tags:
5424
- - mteb
5425
- - sentence-transformers
5426
- - transformers
5427
- - sentence-similarity
5428
- license: mit
5429
  ---
5430
 
5431
 
 
1
  ---
2
+ tags:
3
+ - mteb
4
+ - sentence-transformers
5
+ - transformers
6
+ - sentence-similarity
7
+ - onnx
8
+ license: mit
9
  model-index:
10
  - name: stella_en_1.5B_v5
11
  results:
12
+ - task:
13
+ type: Classification
14
+ dataset:
15
  name: MTEB AmazonCounterfactualClassification (en)
 
 
16
  type: mteb/amazon_counterfactual
17
+ config: en
18
+ split: test
19
+ revision: e8379541af4e31359cca9fbcf4b00f2671dba205
20
  metrics:
21
  - type: accuracy
22
  value: 92.86567164179104
 
30
  value: 93.13621183004571
31
  - type: main_score
32
  value: 92.86567164179104
33
+ - task:
34
  type: Classification
35
+ dataset:
 
36
  name: MTEB AmazonPolarityClassification
 
 
37
  type: mteb/amazon_polarity
38
+ config: default
39
+ split: test
40
+ revision: e2d317d38cd51312af73b3d32a06d1a08b442046
41
  metrics:
42
  - type: accuracy
43
  value: 97.16485
 
51
  value: 97.16351087403213
52
  - type: main_score
53
  value: 97.16485
54
+ - task:
55
  type: Classification
56
+ dataset:
 
57
  name: MTEB AmazonReviewsClassification (en)
 
 
58
  type: mteb/amazon_reviews_multi
59
+ config: en
60
+ split: test
61
+ revision: 1399c76144fd37290681b995c656ef9b2e06e26d
62
  metrics:
63
  - type: accuracy
64
  value: 59.358
 
68
  value: 59.0264615883114
69
  - type: main_score
70
  value: 59.358
71
+ - task:
72
+ type: Retrieval
73
+ dataset:
 
74
  name: MTEB ArguAna
 
 
75
  type: mteb/arguana
76
+ config: default
77
+ split: test
78
+ revision: c22ab2a51041ffd869aaddef7af8d8215647e41a
79
  metrics:
80
  - type: main_score
81
  value: 65.269
 
359
  value: 67.354
360
  - type: recall_at_5
361
  value: 78.236
362
+ - task:
363
+ type: Clustering
364
+ dataset:
 
365
  name: MTEB ArxivClusteringP2P
 
 
366
  type: mteb/arxiv-clustering-p2p
367
+ config: default
368
+ split: test
369
+ revision: a122ad7f3f0291bf49cc6f4d32aa80929df69d5d
370
  metrics:
371
  - type: main_score
372
  value: 55.437138353189994
 
374
  value: 55.437138353189994
375
  - type: v_measure_std
376
  value: 14.718556601335491
377
+ - task:
378
  type: Clustering
379
+ dataset:
 
380
  name: MTEB ArxivClusteringS2S
 
 
381
  type: mteb/arxiv-clustering-s2s
382
+ config: default
383
+ split: test
384
+ revision: f910caf1a6075f7329cdf8c1a6135696f37dbd53
385
  metrics:
386
  - type: main_score
387
  value: 50.65858459544658
 
389
  value: 50.65858459544658
390
  - type: v_measure_std
391
  value: 14.887033747525146
392
+ - task:
393
+ type: Reranking
394
+ dataset:
 
395
  name: MTEB AskUbuntuDupQuestions
 
 
396
  type: mteb/askubuntudupquestions-reranking
397
+ config: default
398
+ split: test
399
+ revision: 2000358ca161889fa9c082cb41daa8dcfb161a54
400
  metrics:
401
  - type: main_score
402
  value: 67.32597152838535
 
416
  value: 41.64561939958336
417
  - type: nAUC_mrr_std
418
  value: 23.179909345891968
419
+ - task:
420
+ type: STS
421
+ dataset:
 
422
  name: MTEB BIOSSES
 
 
423
  type: mteb/biosses-sts
424
+ config: default
425
+ split: test
426
+ revision: d3fb88f8f02e40887cd149695127462bbcf29b4a
427
  metrics:
428
  - type: cosine_pearson
429
  value: 85.790820496042
 
443
  value: 85.790820496042
444
  - type: spearman
445
  value: 83.10731534330517
446
+ - task:
447
+ type: Classification
448
+ dataset:
 
449
  name: MTEB Banking77Classification
 
 
450
  type: mteb/banking77
451
+ config: default
452
+ split: test
453
+ revision: 0fd18e25b25c072e09e0d92ab615fda904d66300
454
  metrics:
455
  - type: accuracy
456
  value: 89.78896103896105
 
460
  value: 89.76107366333488
461
  - type: main_score
462
  value: 89.78896103896105
463
+ - task:
464
+ type: Clustering
465
+ dataset:
 
466
  name: MTEB BiorxivClusteringP2P
 
 
467
  type: mteb/biorxiv-clustering-p2p
468
+ config: default
469
+ split: test
470
+ revision: 65b79d1d13f80053f67aca9498d9402c2d9f1f40
471
  metrics:
472
  - type: main_score
473
  value: 50.68092296236376
 
475
  value: 50.68092296236376
476
  - type: v_measure_std
477
  value: 0.7832640983085436
478
+ - task:
479
  type: Clustering
480
+ dataset:
 
481
  name: MTEB BiorxivClusteringS2S
 
 
482
  type: mteb/biorxiv-clustering-s2s
483
+ config: default
484
+ split: test
485
+ revision: 258694dd0231531bc1fd9de6ceb52a0853c6d908
486
  metrics:
487
  - type: main_score
488
  value: 46.86629236732983
 
490
  value: 46.86629236732983
491
  - type: v_measure_std
492
  value: 0.8784322236350974
493
+ - task:
494
+ type: Retrieval
495
+ dataset:
 
496
  name: MTEB CQADupstackRetrieval
 
 
497
  type: mteb/cqadupstack
498
+ config: default
499
+ split: test
500
+ revision: 4ffe81d471b1924886b33c7567bfb200e9eec5c4
501
  metrics:
502
  - type: main_score
503
  value: 47.74883333333334
 
781
  value: 46.01841666666666
782
  - type: recall_at_5
783
  value: 52.482416666666666
784
+ - task:
785
  type: Retrieval
786
+ dataset:
 
787
  name: MTEB ClimateFEVER
 
 
788
  type: mteb/climate-fever
789
+ config: default
790
+ split: test
791
+ revision: 47f2ac6acb640fc46020b02a5b59fdda04d39380
792
  metrics:
793
  - type: main_score
794
  value: 46.113
 
1072
  value: 35.150999999999996
1073
  - type: recall_at_5
1074
  value: 42.748000000000005
1075
+ - task:
1076
  type: Retrieval
1077
+ dataset:
 
1078
  name: MTEB DBPedia
 
 
1079
  type: mteb/dbpedia
1080
+ config: default
1081
+ split: test
1082
+ revision: c0f706b76e590d620bd6618b3ca8efdd34e2d659
1083
  metrics:
1084
  - type: main_score
1085
  value: 52.276999999999994
 
1363
  value: 17.876
1364
  - type: recall_at_5
1365
  value: 22.536
1366
+ - task:
1367
+ type: Classification
1368
+ dataset:
 
1369
  name: MTEB EmotionClassification
 
 
1370
  type: mteb/emotion
1371
+ config: default
1372
+ split: test
1373
+ revision: 4f58c6b202a23cf9a4da393831edf4f9183cad37
1374
  metrics:
1375
  - type: accuracy
1376
  value: 84.29499999999999
 
1380
  value: 84.96026012933847
1381
  - type: main_score
1382
  value: 84.29499999999999
1383
+ - task:
1384
+ type: Retrieval
1385
+ dataset:
 
1386
  name: MTEB FEVER
 
 
1387
  type: mteb/fever
1388
+ config: default
1389
+ split: test
1390
+ revision: bea83ef9e8fb933d90a2f1d5515737465d613e12
1391
  metrics:
1392
  - type: main_score
1393
  value: 94.83200000000001
 
1671
  value: 95.069
1672
  - type: recall_at_5
1673
  value: 96.177
1674
+ - task:
1675
  type: Retrieval
1676
+ dataset:
 
1677
  name: MTEB FiQA2018
 
 
1678
  type: mteb/fiqa
1679
+ config: default
1680
+ split: test
1681
+ revision: 27a168819829fe9bcd655c2df245fb19452e8e06
1682
  metrics:
1683
  - type: main_score
1684
  value: 60.480000000000004
 
1962
  value: 50.221000000000004
1963
  - type: recall_at_5
1964
  value: 58.209999999999994
1965
+ - task:
1966
  type: Retrieval
1967
+ dataset:
 
1968
  name: MTEB HotpotQA
 
 
1969
  type: mteb/hotpotqa
1970
+ config: default
1971
+ split: test
1972
+ revision: ab518f4d6fcca38d87c25209f94beba119d02014
1973
  metrics:
1974
  - type: main_score
1975
  value: 76.67399999999999
 
2253
  value: 68.879
2254
  - type: recall_at_5
2255
  value: 73.896
2256
+ - task:
2257
+ type: Classification
2258
+ dataset:
 
2259
  name: MTEB ImdbClassification
 
 
2260
  type: mteb/imdb
2261
+ config: default
2262
+ split: test
2263
+ revision: 3d86128a09e091d6018b6d26cad27f2739fc2db7
2264
  metrics:
2265
  - type: accuracy
2266
  value: 96.6608
 
2274
  value: 96.66029695623423
2275
  - type: main_score
2276
  value: 96.6608
2277
+ - task:
2278
+ type: Retrieval
2279
+ dataset:
 
2280
  name: MTEB MSMARCO
 
 
2281
  type: mteb/msmarco
2282
+ config: default
2283
+ split: dev
2284
+ revision: c5a29a104738b98a9e76336939199e264163d4a0
2285
  metrics:
2286
  - type: main_score
2287
  value: 45.217
 
2565
  value: 45.535
2566
  - type: recall_at_5
2567
  value: 55.394
2568
+ - task:
2569
+ type: Classification
2570
+ dataset:
 
2571
  name: MTEB MTOPDomainClassification (en)
 
 
2572
  type: mteb/mtop_domain
2573
+ config: en
2574
+ split: test
2575
+ revision: d80d48c1eb48d3562165c59d59d0034df9fff0bf
2576
  metrics:
2577
  - type: accuracy
2578
  value: 99.01276789785682
 
2582
  value: 99.01406884928141
2583
  - type: main_score
2584
  value: 99.01276789785682
2585
+ - task:
2586
  type: Classification
2587
+ dataset:
 
2588
  name: MTEB MTOPIntentClassification (en)
 
 
2589
  type: mteb/mtop_intent
2590
+ config: en
2591
+ split: test
2592
+ revision: ae001d0e6b1228650b7bd1c2c65fb50ad11a8aba
2593
  metrics:
2594
  - type: accuracy
2595
  value: 92.78385772913816
 
2599
  value: 93.90424147486428
2600
  - type: main_score
2601
  value: 92.78385772913816
2602
+ - task:
2603
  type: Classification
2604
+ dataset:
 
2605
  name: MTEB MassiveIntentClassification (en)
 
 
2606
  type: mteb/amazon_massive_intent
2607
+ config: en
2608
+ split: test
2609
+ revision: 4672e20407010da34463acc759c162ca9734bca6
2610
  metrics:
2611
  - type: accuracy
2612
  value: 85.83053127101546
 
2616
  value: 85.81759723866098
2617
  - type: main_score
2618
  value: 85.83053127101546
2619
+ - task:
2620
  type: Classification
2621
+ dataset:
 
2622
  name: MTEB MassiveScenarioClassification (en)
 
 
2623
  type: mteb/amazon_massive_scenario
2624
+ config: en
2625
+ split: test
2626
+ revision: fad2c6e8459f9e1c45d9315f4953d921437d70f8
2627
  metrics:
2628
  - type: accuracy
2629
  value: 90.19838601210489
 
2633
  value: 90.11422965504119
2634
  - type: main_score
2635
  value: 90.19838601210489
2636
+ - task:
2637
+ type: Clustering
2638
+ dataset:
 
2639
  name: MTEB MedrxivClusteringP2P
 
 
2640
  type: mteb/medrxiv-clustering-p2p
2641
+ config: default
2642
+ split: test
2643
+ revision: e7a26af6f3ae46b30dde8737f02c07b1505bcc73
2644
  metrics:
2645
  - type: main_score
2646
  value: 46.866746897607094
 
2648
  value: 46.866746897607094
2649
  - type: v_measure_std
2650
  value: 1.0966477896919726
2651
+ - task:
2652
  type: Clustering
2653
+ dataset:
 
2654
  name: MTEB MedrxivClusteringS2S
 
 
2655
  type: mteb/medrxiv-clustering-s2s
2656
+ config: default
2657
+ split: test
2658
+ revision: 35191c8c0dca72d8ff3efcd72aa802307d469663
2659
  metrics:
2660
  - type: main_score
2661
  value: 44.6538827415503
 
2663
  value: 44.6538827415503
2664
  - type: v_measure_std
2665
  value: 1.1649569936599116
2666
+ - task:
2667
+ type: Reranking
2668
+ dataset:
 
2669
  name: MTEB MindSmallReranking
 
 
2670
  type: mteb/mind_small
2671
+ config: default
2672
+ split: test
2673
+ revision: 59042f120c80e8afa9cdbb224f67076cec0fc9a7
2674
  metrics:
2675
  - type: main_score
2676
  value: 33.05449204940555
 
2690
  value: -15.304687384645769
2691
  - type: nAUC_mrr_std
2692
  value: -0.519919931348978
2693
+ - task:
2694
+ type: Retrieval
2695
+ dataset:
 
2696
  name: MTEB NFCorpus
 
 
2697
  type: mteb/nfcorpus
2698
+ config: default
2699
+ split: test
2700
+ revision: ec0fa4fe99da2ff19ca1214b7966684033a58814
2701
  metrics:
2702
  - type: main_score
2703
  value: 41.998000000000005
 
2981
  value: 13.267999999999999
2982
  - type: recall_at_5
2983
  value: 16.141
2984
+ - task:
2985
  type: Retrieval
2986
+ dataset:
 
2987
  name: MTEB NQ
 
 
2988
  type: mteb/nq
2989
+ config: default
2990
+ split: test
2991
+ revision: b774495ed302d8c44a3a7ea25c90dbce03968f31
2992
  metrics:
2993
  - type: main_score
2994
  value: 71.8
 
3272
  value: 74.394
3273
  - type: recall_at_5
3274
  value: 82.711
3275
+ - task:
3276
  type: Retrieval
3277
+ dataset:
 
3278
  name: MTEB QuoraRetrieval
 
 
3279
  type: mteb/quora
3280
+ config: default
3281
+ split: test
3282
+ revision: e4e08e0b7dbe3c8700f0daef558ff32256715259
3283
  metrics:
3284
  - type: main_score
3285
  value: 90.025
 
3563
  value: 89.276
3564
  - type: recall_at_5
3565
  value: 93.46
3566
+ - task:
3567
+ type: Clustering
3568
+ dataset:
 
3569
  name: MTEB RedditClustering
 
 
3570
  type: mteb/reddit-clustering
3571
+ config: default
3572
+ split: test
3573
+ revision: 24640382cdbf8abc73003fb0fa6d111a705499eb
3574
  metrics:
3575
  - type: main_score
3576
  value: 72.86492101891123
 
3578
  value: 72.86492101891123
3579
  - type: v_measure_std
3580
  value: 2.778711445144635
3581
+ - task:
3582
  type: Clustering
3583
+ dataset:
 
3584
  name: MTEB RedditClusteringP2P
 
 
3585
  type: mteb/reddit-clustering-p2p
3586
+ config: default
3587
+ split: test
3588
+ revision: 385e3cb46b4cfa89021f56c4380204149d0efe33
3589
  metrics:
3590
  - type: main_score
3591
  value: 75.27316726548479
 
3593
  value: 75.27316726548479
3594
  - type: v_measure_std
3595
  value: 8.87871936725338
3596
+ - task:
3597
+ type: Retrieval
3598
+ dataset:
 
3599
  name: MTEB SCIDOCS
 
 
3600
  type: mteb/scidocs
3601
+ config: default
3602
+ split: test
3603
+ revision: f8c2fcf00f625baaa80f62ec5bd9e1fff3b8ae88
3604
  metrics:
3605
  - type: main_score
3606
  value: 26.638
 
3884
  value: 14.127999999999998
3885
  - type: recall_at_5
3886
  value: 19.673
3887
+ - task:
3888
+ type: STS
3889
+ dataset:
 
3890
  name: MTEB SICK-R
 
 
3891
  type: mteb/sickr-sts
3892
+ config: default
3893
+ split: test
3894
+ revision: 20a6d6f312dd54037fe07a32d58e5e168867909d
3895
  metrics:
3896
  - type: cosine_pearson
3897
  value: 86.86608529160739
 
3911
  value: 86.86608529160739
3912
  - type: spearman
3913
  value: 82.88625166203383
3914
+ - task:
3915
  type: STS
3916
+ dataset:
 
3917
  name: MTEB STS12
 
 
3918
  type: mteb/sts12-sts
3919
+ config: default
3920
+ split: test
3921
+ revision: a0d554a64d88156834ff5ae9920b964011b16384
3922
  metrics:
3923
  - type: cosine_pearson
3924
  value: 87.0445014940449
 
3938
  value: 87.0445014940449
3939
  - type: spearman
3940
  value: 80.0880365116599
3941
+ - task:
3942
  type: STS
3943
+ dataset:
 
3944
  name: MTEB STS13
 
 
3945
  type: mteb/sts13-sts
3946
+ config: default
3947
+ split: test
3948
+ revision: 7e90230a92c190f1bf69ae9002b8cea547a64cca
3949
  metrics:
3950
  - type: cosine_pearson
3951
  value: 89.33900828959968
 
3965
  value: 89.33900828959968
3966
  - type: spearman
3967
  value: 89.68256358526733
3968
+ - task:
3969
  type: STS
3970
+ dataset:
 
3971
  name: MTEB STS14
 
 
3972
  type: mteb/sts14-sts
3973
+ config: default
3974
+ split: test
3975
+ revision: 6031580fec1f6af667f0bd2da0a551cf4f0b2375
3976
  metrics:
3977
  - type: cosine_pearson
3978
  value: 86.42029843639123
 
3992
  value: 86.42029843639123
3993
  - type: spearman
3994
  value: 85.0707889220723
3995
+ - task:
3996
  type: STS
3997
+ dataset:
 
3998
  name: MTEB STS15
 
 
3999
  type: mteb/sts15-sts
4000
+ config: default
4001
+ split: test
4002
+ revision: ae752c7c21bf194d8b67fd573edf7ae58183cbe3
4003
  metrics:
4004
  - type: cosine_pearson
4005
  value: 88.3660081271444
 
4019
  value: 88.3660081271444
4020
  - type: spearman
4021
  value: 89.39375083609528
4022
+ - task:
4023
  type: STS
4024
+ dataset:
 
4025
  name: MTEB STS16
 
 
4026
  type: mteb/sts16-sts
4027
+ config: default
4028
+ split: test
4029
+ revision: 4d8694f8f0e0100860b497b999b3dbed754a0513
4030
  metrics:
4031
  - type: cosine_pearson
4032
  value: 85.60708247171874
 
4046
  value: 85.60708247171874
4047
  - type: spearman
4048
  value: 87.15234952832193
4049
+ - task:
4050
  type: STS
4051
+ dataset:
 
4052
  name: MTEB STS17 (en-en)
 
 
4053
  type: mteb/sts17-crosslingual-sts
4054
+ config: en-en
4055
+ split: test
4056
+ revision: faeb762787bd10488a50c8b5be4a3b82e411949c
4057
  metrics:
4058
  - type: cosine_pearson
4059
  value: 91.25898556808458
 
4073
  value: 91.25898556808458
4074
  - type: spearman
4075
  value: 91.35372390581641
4076
+ - task:
4077
  type: STS
4078
+ dataset:
 
4079
  name: MTEB STS22 (en)
 
 
4080
  type: mteb/sts22-crosslingual-sts
4081
+ config: en
4082
+ split: test
4083
+ revision: de9d86b3b84231dc21f76c7b7af1f28e2f57f6e3
4084
  metrics:
4085
  - type: cosine_pearson
4086
  value: 67.61637111515797
 
4100
  value: 67.61637111515797
4101
  - type: spearman
4102
  value: 68.10379096526697
4103
+ - task:
4104
  type: STS
4105
+ dataset:
 
4106
  name: MTEB STSBenchmark
 
 
4107
  type: mteb/stsbenchmark-sts
4108
+ config: default
4109
+ split: test
4110
+ revision: b0fddb56ed78048fa8b90373c8a3cfc37b684831
4111
  metrics:
4112
  - type: cosine_pearson
4113
  value: 87.81592853782297
 
4127
  value: 87.81592853782297
4128
  - type: spearman
4129
  value: 88.2302550329183
4130
+ - task:
4131
+ type: Reranking
4132
+ dataset:
 
4133
  name: MTEB SciDocsRR
 
 
4134
  type: mteb/scidocs-reranking
4135
+ config: default
4136
+ split: test
4137
+ revision: d3c5e1fc0b855ab6097bf1cda04dd73947d7caab
4138
  metrics:
4139
  - type: main_score
4140
  value: 89.196009707431
 
4154
  value: 86.38341077184032
4155
  - type: nAUC_mrr_std
4156
  value: 75.38945014727746
4157
+ - task:
4158
+ type: Retrieval
4159
+ dataset:
 
4160
  name: MTEB SciFact
 
 
4161
  type: mteb/scifact
4162
+ config: default
4163
+ split: test
4164
+ revision: 0228b52cf27578f30900b9e5271d331663a030d7
4165
  metrics:
4166
  - type: main_score
4167
  value: 80.08999999999999
 
4445
  value: 80.972
4446
  - type: recall_at_5
4447
  value: 89.90599999999999
4448
+ - task:
4449
+ type: PairClassification
4450
+ dataset:
 
4451
  name: MTEB SprintDuplicateQuestions
 
 
4452
  type: mteb/sprintduplicatequestions-pairclassification
4453
+ config: default
4454
+ split: test
4455
+ revision: d66bd1f72af766a5cc4b0ca5e00c162f89e8cc46
4456
  metrics:
4457
  - type: cosine_accuracy
4458
  value: 99.81881188118813
 
4534
  value: 92.59645464025026
4535
  - type: similarity_recall
4536
  value: 88.8
4537
+ - task:
4538
+ type: Clustering
4539
+ dataset:
 
4540
  name: MTEB StackExchangeClustering
 
 
4541
  type: mteb/stackexchange-clustering
4542
+ config: default
4543
+ split: test
4544
+ revision: 6cbc1f7b2bc0622f2e39d2c77fa502909748c259
4545
  metrics:
4546
  - type: main_score
4547
  value: 80.28558559137414
 
4549
  value: 80.28558559137414
4550
  - type: v_measure_std
4551
  value: 2.795276520287584
4552
+ - task:
4553
  type: Clustering
4554
+ dataset:
 
4555
  name: MTEB StackExchangeClusteringP2P
 
 
4556
  type: mteb/stackexchange-clustering-p2p
4557
+ config: default
4558
+ split: test
4559
+ revision: 815ca46b2622cec33ccafc3735d572c266efdb44
4560
  metrics:
4561
  - type: main_score
4562
  value: 49.57135582416209
 
4564
  value: 49.57135582416209
4565
  - type: v_measure_std
4566
  value: 1.6414135468423754
4567
+ - task:
4568
+ type: Reranking
4569
+ dataset:
 
4570
  name: MTEB StackOverflowDupQuestions
 
 
4571
  type: mteb/stackoverflowdupquestions-reranking
4572
+ config: default
4573
+ split: test
4574
+ revision: e185fbe320c72810689fc5848eb6114e1ef5ec69
4575
  metrics:
4576
  - type: main_score
4577
  value: 55.253002583598644
 
4591
  value: 10.586310195339053
4592
  - type: nAUC_mrr_std
4593
  value: 8.47326494370076
4594
+ - task:
4595
+ type: Summarization
4596
+ dataset:
 
4597
  name: MTEB SummEval
 
 
4598
  type: mteb/summeval
4599
+ config: default
4600
+ split: test
4601
+ revision: cda12ad7615edc362dbf25a00fdd61d3b1eaf93c
4602
  metrics:
4603
  - type: cosine_pearson
4604
  value: 31.19874648747059
 
4614
  value: 31.19874648747059
4615
  - type: spearman
4616
  value: 31.493550648844863
4617
+ - task:
4618
+ type: Retrieval
4619
+ dataset:
 
4620
  name: MTEB TRECCOVID
 
 
4621
  type: mteb/trec-covid
4622
+ config: default
4623
+ split: test
4624
+ revision: bb9466bac8153a0349341eb1b22e06409e78ef4e
4625
  metrics:
4626
  - type: main_score
4627
  value: 85.983
 
4905
  value: 0.7250000000000001
4906
  - type: recall_at_5
4907
  value: 1.1820000000000002
4908
+ - task:
4909
  type: Retrieval
4910
+ dataset:
 
4911
  name: MTEB Touche2020
 
 
4912
  type: mteb/touche2020
4913
+ config: default
4914
+ split: test
4915
+ revision: a34f9a33db75fa0cbb21bb5cfc3dae8dc8bec93f
4916
  metrics:
4917
  - type: main_score
4918
  value: 29.944
 
5196
  value: 7.383000000000001
5197
  - type: recall_at_5
5198
  value: 11.434
5199
+ - task:
5200
+ type: Classification
5201
+ dataset:
 
5202
  name: MTEB ToxicConversationsClassification
 
 
5203
  type: mteb/toxic_conversations_50k
5204
+ config: default
5205
+ split: test
5206
+ revision: edfaf9da55d3dd50d43143d90c1ac476895ae6de
5207
  metrics:
5208
  - type: accuracy
5209
  value: 88.759765625
 
5217
  value: 90.54372649306606
5218
  - type: main_score
5219
  value: 88.759765625
5220
+ - task:
5221
  type: Classification
5222
+ dataset:
 
5223
  name: MTEB TweetSentimentExtractionClassification
 
 
5224
  type: mteb/tweet_sentiment_extraction
5225
+ config: default
5226
+ split: test
5227
+ revision: d604517c81ca91fe16a244d1248fc021f9ecee7a
5228
  metrics:
5229
  - type: accuracy
5230
  value: 74.8443689869836
 
5234
  value: 74.7369003946243
5235
  - type: main_score
5236
  value: 74.8443689869836
5237
+ - task:
5238
+ type: Clustering
5239
+ dataset:
 
5240
  name: MTEB TwentyNewsgroupsClustering
 
 
5241
  type: mteb/twentynewsgroups-clustering
5242
+ config: default
5243
+ split: test
5244
+ revision: 6125ec4e24fa026cec8a478383ee943acfbd5449
5245
  metrics:
5246
  - type: main_score
5247
  value: 61.42918790942448
 
5249
  value: 61.42918790942448
5250
  - type: v_measure_std
5251
  value: 1.0156550098843082
5252
+ - task:
5253
+ type: PairClassification
5254
+ dataset:
 
5255
  name: MTEB TwitterSemEval2015
 
 
5256
  type: mteb/twittersemeval2015-pairclassification
5257
+ config: default
5258
+ split: test
5259
+ revision: 70970daeab8776df92f5ea462b6173c0b46fd2d1
5260
  metrics:
5261
  - type: cosine_accuracy
5262
  value: 88.22197055492639
 
5338
  value: 71.64922770303936
5339
  - type: similarity_recall
5340
  value: 75.8839050131926
5341
+ - task:
5342
  type: PairClassification
5343
+ dataset:
 
5344
  name: MTEB TwitterURLCorpus
 
 
5345
  type: mteb/twitterurlcorpus-pairclassification
5346
+ config: default
5347
+ split: test
5348
+ revision: 8b6510b0b1fa4e4c4f879467980e9be563ec1cdf
5349
  metrics:
5350
  - type: cosine_accuracy
5351
  value: 89.88628866379477
 
5427
  value: 76.93126197063205
5428
  - type: similarity_recall
5429
  value: 83.50015398829689
 
 
 
 
 
 
 
 
5430
  ---
5431
 
5432
 
onnx/added_tokens.json ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ {
2
+ "<|endoftext|>": 151643,
3
+ "<|im_end|>": 151645,
4
+ "<|im_start|>": 151644
5
+ }
onnx/config.json ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_attn_implementation_autoset": true,
3
+ "architectures": [
4
+ "Qwen2ForCausalLM"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "auto_map": {
8
+ "AutoModel": "NovaSearch/stella_en_1.5B_v5--modeling_qwen.Qwen2Model",
9
+ "AutoModelForCausalLM": "NovaSearch/stella_en_1.5B_v5--modeling_qwen.Qwen2ForCausalLM",
10
+ "AutoModelForSequenceClassification": "NovaSearch/stella_en_1.5B_v5--modeling_qwen.Qwen2ForSequenceClassification"
11
+ },
12
+ "bos_token_id": 151643,
13
+ "eos_token_id": 151643,
14
+ "export_model_type": "transformer",
15
+ "hidden_act": "silu",
16
+ "hidden_size": 1536,
17
+ "initializer_range": 0.02,
18
+ "intermediate_size": 8960,
19
+ "max_position_embeddings": 131072,
20
+ "max_window_layers": 21,
21
+ "model_type": "qwen2",
22
+ "num_attention_heads": 12,
23
+ "num_hidden_layers": 28,
24
+ "num_key_value_heads": 2,
25
+ "rms_norm_eps": 1e-06,
26
+ "rope_scaling": null,
27
+ "rope_theta": 1000000.0,
28
+ "sliding_window": 131072,
29
+ "tie_word_embeddings": false,
30
+ "torch_dtype": "float32",
31
+ "transformers_version": "4.51.3",
32
+ "use_cache": true,
33
+ "use_sliding_window": false,
34
+ "vocab_size": 151646
35
+ }
onnx/merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
onnx/model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8b8d12c8210ae19b00bbdca6ddfe3d70da0d46312c72bcfa1fd6e3707cfdd7d2
3
- size 874851
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b44c618d7f278c8b171a78c6635b844caa144556b46d144ecaaac8562f6f927
3
+ size 1430611
onnx/model.onnx_data CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4d9d0ac35b704186bd6bf7d969ebccc7929e0cb13acae9f088a061e433141f29
3
- size 6313588736
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b96b4485d9715a6efb678336ed8069976eca6d7b85f05188f3142ffb0561f667
3
+ size 6179371008
onnx/special_tokens_map.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<|im_start|>",
4
+ "<|im_end|>"
5
+ ],
6
+ "eos_token": {
7
+ "content": "<|endoftext|>",
8
+ "lstrip": false,
9
+ "normalized": false,
10
+ "rstrip": false,
11
+ "single_word": false
12
+ },
13
+ "pad_token": {
14
+ "content": "<|endoftext|>",
15
+ "lstrip": false,
16
+ "normalized": false,
17
+ "rstrip": false,
18
+ "single_word": false
19
+ }
20
+ }
onnx/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8372feaa064372d176aff57e8f1e64f194814bb074519104f64c66a2825f091
3
+ size 11419037
onnx/tokenizer_config.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_eos_token": true,
3
+ "add_prefix_space": false,
4
+ "added_tokens_decoder": {
5
+ "151643": {
6
+ "content": "<|endoftext|>",
7
+ "lstrip": false,
8
+ "normalized": false,
9
+ "rstrip": false,
10
+ "single_word": false,
11
+ "special": true
12
+ },
13
+ "151644": {
14
+ "content": "<|im_start|>",
15
+ "lstrip": false,
16
+ "normalized": false,
17
+ "rstrip": false,
18
+ "single_word": false,
19
+ "special": true
20
+ },
21
+ "151645": {
22
+ "content": "<|im_end|>",
23
+ "lstrip": false,
24
+ "normalized": false,
25
+ "rstrip": false,
26
+ "single_word": false,
27
+ "special": true
28
+ }
29
+ },
30
+ "additional_special_tokens": [
31
+ "<|im_start|>",
32
+ "<|im_end|>"
33
+ ],
34
+ "auto_map": {
35
+ "AutoTokenizer": [
36
+ "NovaSearch/stella_en_1.5B_v5--tokenization_qwen.Qwen2Tokenizer",
37
+ "NovaSearch/stella_en_1.5B_v5--tokenization_qwen.Qwen2TokenizerFast"
38
+ ]
39
+ },
40
+ "bos_token": null,
41
+ "chat_template": "{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
42
+ "clean_up_tokenization_spaces": false,
43
+ "eos_token": "<|endoftext|>",
44
+ "errors": "replace",
45
+ "extra_special_tokens": {},
46
+ "model_max_length": 32768,
47
+ "pad_token": "<|endoftext|>",
48
+ "split_special_tokens": false,
49
+ "tokenizer_class": "Qwen2Tokenizer",
50
+ "unk_token": null
51
+ }
onnx/vocab.json ADDED
The diff for this file is too large to render. See raw diff