---
# Model card metadata for Llama-3-8B-Dolphin-Portuguese-v0.3.
#
# `model-index` holds one entry per evaluated model; each item under `results`
# pairs a task, a dataset (with its split and few-shot count), the reported
# metric, and the leaderboard page the score is attributed to.
#
# `task.type`, `dataset.split` and `metrics[].type` are identifiers matched by
# tooling, so they are written as ASCII ids. The `name` fields are free-form
# display labels and are kept exactly as written.
# NOTE(review): metric ids (accuracy / f1_macro / pearson) were restored from
# translated labels - confirm they match the ids the leaderboard publishes.
library_name: transformers

model-index:
  - name: Llama-3-8B-Dolphin-Portuguese-v0.3
    results:
      - task:
          type: text-generation
          name: 文本生成
        dataset:
          name: ENEM挑战赛(无图像)
          type: eduagarcia/enem_challenge
          split: train
          args:
            num_few_shot: 3
        metrics:
          - type: accuracy
            value: 68.86
            name: 准确率
        source:
          url: >-
            https://huggingface.co/spaces/eduagarcia/open_pt_llm_leaderboard?query=adalbertojunior/Llama-3-8B-Dolphin-Portuguese-v0.3
          name: 葡萄牙语开源大模型排行榜
      - task:
          type: text-generation
          name: 文本生成
        dataset:
          name: BLUEX(无图像)
          type: eduagarcia-temp/BLUEX_without_images
          split: train
          args:
            num_few_shot: 3
        metrics:
          - type: accuracy
            value: 57.86
            name: 准确率
        source:
          url: >-
            https://huggingface.co/spaces/eduagarcia/open_pt_llm_leaderboard?query=adalbertojunior/Llama-3-8B-Dolphin-Portuguese-v0.3
          name: 葡萄牙语开源大模型排行榜
      - task:
          type: text-generation
          name: 文本生成
        dataset:
          name: OAB律师资格考试
          type: eduagarcia/oab_exams
          split: train
          args:
            num_few_shot: 3
        metrics:
          - type: accuracy
            value: 61.91
            name: 准确率
        source:
          url: >-
            https://huggingface.co/spaces/eduagarcia/open_pt_llm_leaderboard?query=adalbertojunior/Llama-3-8B-Dolphin-Portuguese-v0.3
          name: 葡萄牙语开源大模型排行榜
      - task:
          type: text-generation
          name: 文本生成
        dataset:
          name: Assin2 RTE
          type: assin2
          split: test
          args:
            num_few_shot: 15
        metrics:
          - type: f1_macro
            value: 93.05
            name: 宏观F1值
        source:
          url: >-
            https://huggingface.co/spaces/eduagarcia/open_pt_llm_leaderboard?query=adalbertojunior/Llama-3-8B-Dolphin-Portuguese-v0.3
          name: 葡萄牙语开源大模型排行榜
      - task:
          type: text-generation
          name: 文本生成
        dataset:
          name: Assin2 STS
          type: eduagarcia/portuguese_benchmark
          split: test
          args:
            num_few_shot: 15
        metrics:
          - type: pearson
            value: 76.48
            name: 皮尔逊系数
        source:
          url: >-
            https://huggingface.co/spaces/eduagarcia/open_pt_llm_leaderboard?query=adalbertojunior/Llama-3-8B-Dolphin-Portuguese-v0.3
          name: 葡萄牙语开源大模型排行榜
      - task:
          type: text-generation
          name: 文本生成
        dataset:
          name: FaQuAD自然语言推理
          type: ruanchaves/faquad-nli
          split: test
          args:
            num_few_shot: 15
        metrics:
          - type: f1_macro
            value: 76.78
            name: 宏观F1值
        source:
          url: >-
            https://huggingface.co/spaces/eduagarcia/open_pt_llm_leaderboard?query=adalbertojunior/Llama-3-8B-Dolphin-Portuguese-v0.3
          name: 葡萄牙语开源大模型排行榜
      - task:
          type: text-generation
          name: 文本生成
        dataset:
          name: HateBR二元分类
          type: ruanchaves/hatebr
          split: test
          args:
            num_few_shot: 25
        metrics:
          - type: f1_macro
            value: 83.25
            name: 宏观F1值
        source:
          url: >-
            https://huggingface.co/spaces/eduagarcia/open_pt_llm_leaderboard?query=adalbertojunior/Llama-3-8B-Dolphin-Portuguese-v0.3
          name: 葡萄牙语开源大模型排行榜
      - task:
          type: text-generation
          name: 文本生成
        dataset:
          name: 葡萄牙语仇恨言论二元分类
          type: hate_speech_portuguese
          split: test
          args:
            num_few_shot: 25
        metrics:
          - type: f1_macro
            value: 68.85
            name: 宏观F1值
        source:
          url: >-
            https://huggingface.co/spaces/eduagarcia/open_pt_llm_leaderboard?query=adalbertojunior/Llama-3-8B-Dolphin-Portuguese-v0.3
          name: 葡萄牙语开源大模型排行榜
      - task:
          type: text-generation
          name: 文本生成
        dataset:
          name: tweetSentBR情感分析
          type: eduagarcia/tweetsentbr_fewshot
          split: test
          args:
            num_few_shot: 25
        metrics:
          - type: f1_macro
            value: 71.3
            name: 宏观F1值
        source:
          url: >-
            https://huggingface.co/spaces/eduagarcia/open_pt_llm_leaderboard?query=adalbertojunior/Llama-3-8B-Dolphin-Portuguese-v0.3
          name: 葡萄牙语开源大模型排行榜

datasets:
  - adalbertojunior/dolphin_portuguese_legal

language:
  - pt
# 模型卡片