# Model-card metadata: Hub task/tag identifiers followed by the MTEB
# evaluation results for this model, in the `model-index` layout.
#
# NOTE(review): pipeline_tag, tags, task/metric `type`, dataset `name`,
# `config` and `split` are machine-readable identifiers, not display text.
# They must stay as their canonical English tokens; localized values will
# not match what consumers look up.
pipeline_tag: sentence-similarity
tags:
- sentence-transformers
- feature-extraction
- sentence-similarity
- mteb
model-index:
- name: SGPT-125M-weightedmean-msmarco-specb-bitfit
  results:
  # Each entry: the task category, the dataset (repo id, config, split and
  # pinned revision), and the metric values reported for that dataset.
  - task:
      type: Classification
    dataset:
      type: mteb/amazon_counterfactual
      name: MTEB AmazonCounterfactualClassification (en)
      config: en
      split: test
      revision: 2d8a100785abf0ae21420d2a55b0c56e3e1ea996
    metrics:
    - type: accuracy
      value: 61.23880597014926
    - type: ap
      value: 25.854431650388644
    - type: f1
      value: 55.751862762818604
  - task:
      type: Classification
    dataset:
      type: mteb/amazon_counterfactual
      name: MTEB AmazonCounterfactualClassification (de)
      config: de
      split: test
      revision: 2d8a100785abf0ae21420d2a55b0c56e3e1ea996
    metrics:
    - type: accuracy
      value: 56.88436830835117
    - type: ap
      value: 72.67279104379772
    - type: f1
      value: 54.449840243786404
  - task:
      type: Classification
    dataset:
      type: mteb/amazon_counterfactual
      name: MTEB AmazonCounterfactualClassification (en-ext)
      config: en-ext
      split: test
      revision: 2d8a100785abf0ae21420d2a55b0c56e3e1ea996
    metrics:
    - type: accuracy
      value: 58.27586206896551
    - type: ap
      value: 14.067357642500387
    - type: f1
      value: 48.172318518691334
  - task:
      type: Classification
    dataset:
      type: mteb/amazon_counterfactual
      name: MTEB AmazonCounterfactualClassification (ja)
      config: ja
      split: test
      revision: 2d8a100785abf0ae21420d2a55b0c56e3e1ea996
    metrics:
    - type: accuracy
      value: 54.64668094218415
    - type: ap
      value: 11.776694555054965
    - type: f1
      value: 44.526622834078765
  - task:
      type: Classification
    dataset:
      type: mteb/amazon_polarity
      name: MTEB AmazonPolarityClassification
      config: default
      split: test
      revision: 80714f8dcf8cefc218ef4f8c5a966dd83f75a0e1
    metrics:
    - type: accuracy
      value: 65.401225
    - type: ap
      value: 60.22809958678552
    - type: f1
      value: 65.0251824898292
  - task:
      type: Classification
    dataset:
      type: mteb/amazon_reviews_multi
      name: MTEB AmazonReviewsClassification (en)
      config: en
      split: test
      revision: c379a6705fec24a2493fa68e011692605f44e119
    metrics:
    - type: accuracy
      value: 31.165999999999993
    - type: f1
      value: 30.908870050167437
  - task:
      type: Classification
    dataset:
      type: mteb/amazon_reviews_multi
      name: MTEB AmazonReviewsClassification (de)
      config: de
      split: test
      revision: c379a6705fec24a2493fa68e011692605f44e119
    metrics:
    - type: accuracy
      value: 24.79
    - type: f1
      value: 24.5833598854121
  - task:
      type: Classification
    dataset:
      type: mteb/amazon_reviews_multi
      name: MTEB AmazonReviewsClassification (es)
      config: es
      split: test
      revision: c379a6705fec24a2493fa68e011692605f44e119
    metrics:
    - type: accuracy
      value: 26.643999999999995
    - type: f1
      value: 26.39012792213563
  - task:
      type: Classification
    dataset:
      type: mteb/amazon_reviews_multi
      name: MTEB AmazonReviewsClassification (fr)
      config: fr
      split: test
      revision: c379a6705fec24a2493fa68e011692605f44e119
    metrics:
    - type: accuracy
      value: 26.386000000000003
    - type: f1
      value: 26.276867791454873
  - task:
      type: Classification
    dataset:
      type: mteb/amazon_reviews_multi
      name: MTEB AmazonReviewsClassification (ja)
      config: ja
      split: test
      revision: c379a6705fec24a2493fa68e011692605f44e119
    metrics:
    - type: accuracy
      value: 22.078000000000003
    - type: f1
      value: 21.797960290226843
  - task:
      type: Classification
    dataset:
      type: mteb/amazon_reviews_multi
      name: MTEB AmazonReviewsClassification (zh)
      config: zh
      split: test
      revision: c379a6705fec24a2493fa68e011692605f44e119
    metrics:
    - type: accuracy
      value: 24.274
    - type: f1
      value: 23.887054434822627
  - task:
      type: Retrieval
    dataset:
      type: arguana
      name: MTEB ArguAna
      config: default
      split: test
      revision: 5b3e3697907184a9b77a3c99ee9ea1a9cbb1e4e3
    metrics:
    - type: map_at_1
      value: 22.404
    - type: map_at_10
      value: 36.845
    - type: map_at_100
      value: 37.945
    - type: map_at_1000
      value: 37.966
    - type: map_at_3
      value: 31.78
    - type: map_at_5
      value: 34.608
    - type: mrr_at_1
      value: 22.902
    - type: mrr_at_10
      value: 37.034
    - type: mrr_at_100
      value: 38.134
    - type: mrr_at_1000
      value: 38.155
    - type: mrr_at_3
      value: 31.935000000000002
    - type: mrr_at_5
      value: 34.812
    - type: ndcg_at_1
      value: 22.404
    - type: ndcg_at_10
      value: 45.425
    - type: ndcg_at_100
      value: 50.354
    - type: ndcg_at_1000
      value: 50.873999999999995
    - type: ndcg_at_3
      value: 34.97
    - type: ndcg_at_5
      value: 40.081
    - type: precision_at_1
      value: 22.404
    - type: precision_at_10
      value: 7.303999999999999
    - type: precision_at_100
      value: 0.951
    - type: precision_at_1000
      value: 0.099
    - type: precision_at_3
      value: 14.746
    - type: precision_at_5
      value: 11.337
    - type: recall_at_1
      value: 22.404
    - type: recall_at_10
      value: 73.044
    - type: recall_at_100
      value: 95.092
    - type: recall_at_1000
      value: 99.075
    - type: recall_at_3
      value: 44.239
    - type: recall_at_5
      value: 56.686
  - task:
      type: Clustering
    dataset:
      type: mteb/arxiv-clustering-p2p
      name: MTEB ArxivClusteringP2P
      config: default
      split: test
      revision: 0bbdb47bcbe3a90093699aefeed338a0f28a7ee8
    metrics:
    - type: v_measure
      value: 39.70858340673288
  - task:
      type: Clustering
    dataset:
      type: mteb/arxiv-clustering-s2s
      name: MTEB ArxivClusteringS2S
      config: default
      split: test
      revision: b73bd54100e5abfa6e3a23dcafb46fe4d2438dc3
    metrics:
    - type: v_measure
      value: 28.242847713721048
  - task:
      type: Reranking
    dataset:
      type: mteb/askubuntudupquestions-reranking
      name: MTEB AskUbuntuDupQuestions
      config: default
      split: test
      revision: 4d853f94cd57d85ec13805aeeac3ae3e5eb4c49c
    metrics:
    - type: map
      value: 55.83700395192393
    - type: mrr
      value: 70.3891307215407
  - task:
      type: STS
    dataset:
      type: mteb/biosses-sts
      name: MTEB BIOSSES
      config: default
      split: test
      revision: 9ee918f184421b6bd48b78f6c714d86546106103
    metrics:
    - type: cos_sim_pearson
      value: 79.25366801756223
    - type: cos_sim_spearman
      value: 75.20954502580506
    - type: euclidean_pearson
      value: 78.79900722991617
    - type: euclidean_spearman
      value: 77.79996549607588
    - type: manhattan_pearson
      value: 78.18408109480399
    - type: manhattan_spearman
      value: 76.85958262303106
  - task:
      type: Classification
    dataset:
      type: mteb/banking77
      name: MTEB Banking77Classification
      config: default
      split: test
      revision: 44fa15921b4c889113cc5df03dd4901b49161ab7
    metrics:
    - type: accuracy
      value: 77.70454545454545
    - type: f1
      value: 77.6929000113803
  - task:
      type: Clustering
    dataset:
      type: mteb/biorxiv-clustering-p2p
      name: MTEB BiorxivClusteringP2P
      config: default
      split: test
      revision: 11d0121201d1f1f280e8cc8f3d98fb9c4d9f9c55
    metrics:
    - type: v_measure
      value: 33.63260395543984
- task:
type: 聚类
dataset:
type: mteb/biorxiv-clustering-s2s
name: MTEB Biorxiv聚类S2S
config: 默认
split: 测试集
revision: c0fab014e1bcb8d3a5e31b2088972a1e01547dc1