-
Notifications
You must be signed in to change notification settings - Fork 0
/
config.json
155 lines (154 loc) · 5.92 KB
/
config.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
[
{
"source_language": "Kashmiri",
"source_language_code": "kas",
"target_language": "Urdu",
"target_language_code": "urd",
"corpus": "data/corpus/kswiki-20221201.txt",
"source_wordlist": "data/wordlists/kswiki-20221201_wordlist.txt",
"target_dictionary": "data/dictionary/Urdu.txt",
"common_words": "data/common/Kashmiri_Urdu_common.txt",
"script_map": "data/scripts/Kashmiri-Urdu.tsv",
"datasets": "data/datasets/Kashmiri-Urdu",
"FLORES": "data/machine_translation/FLORES200/kas_Arab.devtest",
"FLORES_dataset": "data/machine_translation/Kashmiri-Urdu"
},
{
"source_language": "Sindhi",
"source_language_code": "snd",
"target_language": "Urdu",
"target_language_code": "urd",
"corpus": "data/corpus/sdwiki-20221201.txt",
"source_wordlist": "data/wordlists/sdwiki-20221201_wordlist.txt",
"target_dictionary": "data/dictionary/Urdu.txt",
"common_words": "data/common/Sindhi_Urdu_common.txt",
"script_map": "data/scripts/Sindhi-Urdu.tsv",
"datasets": "data/datasets/Sindhi-Urdu",
"FLORES": "data/machine_translation/FLORES200/snd_Arab.devtest",
"FLORES_dataset": "data/machine_translation/Sindhi-Urdu"
},
{
"source_language": "Sorani",
"source_language_code": "ckb",
"target_language": "Arabic",
"target_language_code": "arb",
"corpus": "data/corpus/ckb_Pewan_AS_ckb_clean_full.txt",
"source_wordlist": "data/wordlists/ckb_Pewan_corpus_wordlist.txt",
"target_dictionary": "data/dictionary/Arabic.txt",
"common_words": "data/common/Sorani_Arabic_common.txt",
"script_map": "data/scripts/Kurdish-Arabic.tsv",
"datasets": "data/datasets/Sorani-Arabic",
"FLORES": "data/machine_translation/FLORES200/ckb_Arab.devtest",
"FLORES_dataset": "data/machine_translation/Sorani-Arabic"
},
{
"source_language": "Kurmanji",
"source_language_code": "kmr",
"target_language": "Arabic",
"target_language_code": "arb",
"corpus": "data/corpus/kmr-arab_corpus.txt",
"source_wordlist": "data/wordlists/kmr-arab_corpus_wordlist.txt",
"target_dictionary": "data/dictionary/Arabic.txt",
"common_words": "data/common/Kurmanji_Arabic_common.txt",
"script_map": "data/scripts/Kurdish-Arabic.tsv",
"datasets": "data/datasets/Kurmanji-Arabic"
},
{
"source_language": "Gorani",
"source_language_code": "hac",
"target_language": "Arabic",
"target_language_code": "arb",
"corpus": "data/corpus/hac_arb_all.txt",
"source_wordlist": "data/wordlists/hac_corpus_wordlist.txt",
"target_dictionary": "data/dictionary/Arabic.txt",
"common_words": "data/common/Gorani_Arabic_common.txt",
"script_map": "data/scripts/Gorani-Arabic.tsv",
"datasets": "data/datasets/Gorani-Arabic"
},
{
"source_language": "Sorani",
"source_language_code": "ckb",
"target_language": "Persian",
"target_language_code": "fas",
"corpus": "data/corpus/ckb_Pewan_AS_ckb_clean_full.txt",
"source_wordlist": "data/wordlists/ckb_Pewan_corpus_wordlist.txt",
"target_dictionary": "data/dictionary/Persian.txt",
"common_words": "data/common/Sorani_Persian_common.txt",
"script_map": "data/scripts/Kurdish-Persian.tsv",
"datasets": "data/datasets/Sorani-Persian",
"FLORES": "data/machine_translation/FLORES200/ckb_Arab.devtest",
"FLORES_dataset": "data/machine_translation/Sorani-Persian"
},
{
"source_language": "Kurmanji",
"source_language_code": "kmr",
"target_language": "Persian",
"target_language_code": "fas",
"corpus": "data/corpus/kmr-arab_corpus.txt",
"source_wordlist": "data/wordlists/kmr-arab_corpus_wordlist.txt",
"target_dictionary": "data/dictionary/Persian.txt",
"common_words": "data/common/Kurmanji_Persian_common.txt",
"script_map": "data/scripts/Kurdish-Persian.tsv",
"datasets": "data/datasets/Kurmanji-Persian"
},
{
"source_language": "Gorani",
"source_language_code": "hac",
"target_language": "Persian",
"target_language_code": "fas",
"corpus": "data/corpus/hac_arb_all.txt",
"source_wordlist": "data/wordlists/hac_corpus_wordlist.txt",
"target_dictionary": "data/dictionary/Persian.txt",
"common_words": "data/common/Gorani_Persian_common.txt",
"script_map": "data/scripts/Gorani-Persian.tsv",
"datasets": "data/datasets/Gorani-Persian"
},
{
"source_language": "Gorani",
"source_language_code": "hac",
"target_language": "Sorani",
"target_language_code": "ckb",
"corpus": "data/corpus/hac_arb_all.txt",
"source_wordlist": "data/wordlists/hac_corpus_wordlist.txt",
"target_dictionary": "data/dictionary/SoraniKurdish.txt",
"common_words": "data/common/Gorani_Sorani_common.txt",
"script_map": "data/scripts/Gorani-Kurdish.tsv",
"datasets": "data/datasets/Gorani-Sorani"
},
{
"source_language": "AzeriTurkish",
"source_language_code": "azb",
"target_language": "Persian",
"target_language_code": "fas",
"corpus": "data/corpus/azbwiki-20221201.txt",
"source_wordlist": "data/wordlists/azbwiki-20221201_wordlist.txt",
"target_dictionary": "data/dictionary/Persian.txt",
"common_words": "data/common/AzeriTurkish_Persian_common.txt",
"script_map": "data/scripts/AzeriTurkish-Persian.tsv",
"datasets": "data/datasets/AzeriTurkish-Persian"
},
{
"source_language": "Gilaki",
"source_language_code": "glk",
"target_language": "Persian",
"target_language_code": "fas",
"corpus": "data/corpus/glkwiki-20221201.txt",
"source_wordlist": "data/wordlists/glkwiki-20221201_wordlist.txt",
"target_dictionary": "data/dictionary/Persian.txt",
"common_words": "data/common/Gilaki_Persian_common.txt",
"script_map": "data/scripts/Gilaki-Persian.tsv",
"datasets": "data/datasets/Gilaki-Persian"
},
{
"source_language": "Mazanderani",
"source_language_code": "mzn",
"target_language": "Persian",
"target_language_code": "fas",
"corpus": "data/corpus/mznwiki-20221201.txt",
"source_wordlist": "data/wordlists/mznwiki-20221201_wordlist.txt",
"target_dictionary": "data/dictionary/Persian.txt",
"common_words": "data/common/Mazanderani_Persian_common.txt",
"script_map": "data/scripts/Mazanderani-Persian.tsv",
"datasets": "data/datasets/Mazanderani-Persian"
}
]