Skip to content

Commit d681f07

Browse files
committed
Dump on disk (and version) experimental results
1 parent 2b638ab commit d681f07

File tree

2 files changed

+578
-123
lines changed

2 files changed

+578
-123
lines changed

expes/tokenizers_fertilities.json

Lines changed: 72 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,72 @@
1+
{
2+
"wikimedia/wikipedia/20231101.en": {
3+
"gpt-4": 1.3809220628440881,
4+
"google/gemma-7b": 1.3943485262724242,
5+
"microsoft/Phi-3-medium-4k-instruct": 1.64767237182128,
6+
"mistralai/Mistral-7B-v0.1": 1.6146211752368824,
7+
"meta-llama/Meta-Llama-3-8B-Instruct": 1.3791118934371995,
8+
"Qwen/Qwen2.5-7B": 1.4221377476499009,
9+
"bigscience/bloom-7b1": 1.3755539742581426,
10+
"croissantllm/CroissantLLMBase": 1.5767012471443018,
11+
"utter-project/EuroLLM-9B": 1.5209480294121318,
12+
"OpenLLM-France/Lucie-7B": 1.5008114552513638,
13+
"CohereForAI/c4ai-command-r-plus": 1.3982310275520267,
14+
"allenai/OLMo-2-1124-7B-Instruct": 1.4215510030835299
15+
},
16+
"wikimedia/wikipedia/20231101.fr": {
17+
"gpt-4": 1.8529395175694223,
18+
"google/gemma-7b": 1.6441557464889356,
19+
"microsoft/Phi-3-medium-4k-instruct": 1.996634642501269,
20+
"mistralai/Mistral-7B-v0.1": 2.0805805711707306,
21+
"meta-llama/Meta-Llama-3-8B-Instruct": 1.8492545451127114,
22+
"Qwen/Qwen2.5-7B": 1.8761398033427965,
23+
"bigscience/bloom-7b1": 1.422223893411545,
24+
"croissantllm/CroissantLLMBase": 1.5804959672112655,
25+
"utter-project/EuroLLM-9B": 1.734124223680335,
26+
"OpenLLM-France/Lucie-7B": 1.5905920397074582,
27+
"CohereForAI/c4ai-command-r-plus": 1.586136231175619,
28+
"allenai/OLMo-2-1124-7B-Instruct": 1.9298413832434025
29+
},
30+
"wikimedia/wikipedia/20231101.de": {
31+
"gpt-4": 2.7174367093937914,
32+
"google/gemma-7b": 2.438275867877175,
33+
"microsoft/Phi-3-medium-4k-instruct": 2.993447758931429,
34+
"mistralai/Mistral-7B-v0.1": 3.1795634085128603,
35+
"meta-llama/Meta-Llama-3-8B-Instruct": 2.7094359008910374,
36+
"Qwen/Qwen2.5-7B": 2.90382185989321,
37+
"bigscience/bloom-7b1": 2.6884569388064476,
38+
"croissantllm/CroissantLLMBase": 3.4861880779531407,
39+
"utter-project/EuroLLM-9B": 2.580058616449662,
40+
"OpenLLM-France/Lucie-7B": 2.7991207532550657,
41+
"CohereForAI/c4ai-command-r-plus": 2.4974144755680574,
42+
"allenai/OLMo-2-1124-7B-Instruct": 2.7920463541578937
43+
},
44+
"wikimedia/wikipedia/20231101.es": {
45+
"gpt-4": 1.8225358585955305,
46+
"google/gemma-7b": 1.5613474022865241,
47+
"microsoft/Phi-3-medium-4k-instruct": 1.9952571541648314,
48+
"mistralai/Mistral-7B-v0.1": 2.0873181536733116,
49+
"meta-llama/Meta-Llama-3-8B-Instruct": 1.815680116432716,
50+
"Qwen/Qwen2.5-7B": 1.8497290258335088,
51+
"bigscience/bloom-7b1": 1.458626170550949,
52+
"croissantllm/CroissantLLMBase": 2.26073523685504,
53+
"utter-project/EuroLLM-9B": 1.6609343980798816,
54+
"OpenLLM-France/Lucie-7B": 1.7532315823742317,
55+
"CohereForAI/c4ai-command-r-plus": 1.5383225773505174,
56+
"allenai/OLMo-2-1124-7B-Instruct": 1.8630702745488552
57+
},
58+
"wikimedia/wikipedia/20231101.it": {
59+
"gpt-4": 2.0160554015873338,
60+
"google/gemma-7b": 1.7640779775993094,
61+
"microsoft/Phi-3-medium-4k-instruct": 2.155867537879554,
62+
"mistralai/Mistral-7B-v0.1": 2.2668730065610694,
63+
"meta-llama/Meta-Llama-3-8B-Instruct": 2.0103304809877343,
64+
"Qwen/Qwen2.5-7B": 2.0686855609275856,
65+
"bigscience/bloom-7b1": 1.9323933404810552,
66+
"croissantllm/CroissantLLMBase": 2.366233083163069,
67+
"utter-project/EuroLLM-9B": 1.7834779735534292,
68+
"OpenLLM-France/Lucie-7B": 1.8978887248059664,
69+
"CohereForAI/c4ai-command-r-plus": 1.6885279064592478,
70+
"allenai/OLMo-2-1124-7B-Instruct": 2.074444197196205
71+
}
72+
}

0 commit comments

Comments
 (0)