de-francophones committed on
Commit
821bb51
·
verified ·
1 Parent(s): b9fe684

Update index.html

Browse files
Files changed (1) hide show
  1. index.html +12 -4
index.html CHANGED
@@ -8,7 +8,7 @@
8
  </head>
9
  <body>
10
  <div>
11
- <h1>Vous trouverez ci-dessous une liste de 131 jeux de données en français mal référencés sur le Hub :<br>
12
  Below is a list of 131 French datasets that are badly referenced on the Hub:</h1>
13
  </div>
14
  <br><br>
@@ -28,6 +28,7 @@
28
  <a href="https://huggingface.co/datasets/AdrienB134/QA_ASN_test">AdrienB134/QA_ASN_test</a><br>
29
  <a href="https://huggingface.co/datasets/AdrienB134/Small-markdown">AdrienB134/Small-markdown</a><br>
30
  <a href="https://huggingface.co/datasets/ahmadSiddiqi/x-stance_fr">ahmadSiddiqi/x-stance_fr</a><br>
 
31
  <a href="https://huggingface.co/datasets/Alwaly/fr_voxpopuli/">Alwaly/fr_voxpopuli/</a><br>
32
  <a href="https://huggingface.co/datasets/Alwaly/french-Wolof-lang-classification">Alwaly/french-Wolof-lang-classification</a><br>
33
  <a href="https://huggingface.co/datasets/Alwaly/frenchToWolof">Alwaly/frenchToWolof</a><br>
@@ -40,7 +41,7 @@
40
  <a href="https://huggingface.co/datasets/babs/unlabelled-french-voxpopuli">babs/unlabelled-french-voxpopuli</a><br>
41
  <a href="https://huggingface.co/datasets/BitTranslate/chatgpt-prompts-French">BitTranslate/chatgpt-prompts-French</a><br>
42
  <a href="https://huggingface.co/datasets/bosbos/french_english_instruct">bosbos/french_english_instruct</a><br>
43
-
44
  <a href="https://huggingface.co/datasets/Databasesprojec/FinStmts_ConsUncons_French_Predict_part1">Databasesprojec/FinStmts_ConsUncons_French_Predict_part1</a><br>
45
  <a href="https://huggingface.co/datasets/Databasesprojec/FinStmts_ConsUncons_French_Predict_part2">Databasesprojec/FinStmts_ConsUncons_French_Predict_part2</a><br>
46
  <a href="https://huggingface.co/datasets/Databasesprojec/FinStmts_ConsUncons_French_SeqClass">Databasesprojec/FinStmts_ConsUncons_French_SeqClass</a><br>
@@ -85,7 +86,9 @@
85
  <a href="https://huggingface.co/datasets/ismailiismail/French_English_2">ismailiismail/French_English_2</a><br>
86
  <a href="https://huggingface.co/datasets/ismailiismail/FrEn_handpicks">ismailiismail/FrEn_handpicks</a><br>
87
  <a href="https://huggingface.co/datasets/ismailiismail/ner">ismailiismail/ner</a><br>
 
88
  <a href="https://huggingface.co/datasets/ismailiismail/paragraphss_paraphrasing">ismailiismail/paragraphss_paraphrasing</a><br>
 
89
  <a href="https://huggingface.co/datasets/ismailiismail/paraphrasing_french_5000">ismailiismail/paraphrasing_french_5000</a><br>
90
 
91
  <a href="https://huggingface.co/datasets/jwang214/arc_french/">jwang214/arc_french/</a><br>
@@ -94,7 +97,8 @@
94
  <a href="https://huggingface.co/datasets/kaitchup/opus-French-to-English">kaitchup/opus-French-to-English</a><br>
95
  <a href="https://huggingface.co/datasets/kloodia/alpaca_french">kloodia/alpaca_french</a><br>
96
 
97
- <a href="https://huggingface.co/datasets/malteos/wikinews">malteos/wikinews</a><br>
 
98
  <a href="https://huggingface.co/datasets/manu/croissant_french_dataset">manu/croissant_french_dataset</a><br>
99
  <a href="https://huggingface.co/datasets/manu/dataset_en_fr">manu/dataset_en_fr</a><br>
100
  <a href="https://huggingface.co/datasets/manu/dataset_en_fr_short">manu/dataset_en_fr_short</a><br>
@@ -120,6 +124,7 @@
120
  <a href="https://huggingface.co/datasets/Mediform/sharegpt-french">Mediform/sharegpt-french</a><br>
121
  <a href="https://huggingface.co/datasets/musts/french">musts/french</a><br>
122
 
 
123
  <a href="https://huggingface.co/datasets/nirantk/french-books">nirantk/french-books</a><br>
124
 
125
  <a href="https://huggingface.co/datasets/odunola/french-audio-preprocessed">odunola/french-audio-preprocessed</a><br>
@@ -131,6 +136,7 @@
131
  <a href="https://huggingface.co/datasets/paulml/chatml-OpenHermes2.5-dpo-binarized-alpha-french">paulml/chatml-OpenHermes2.5-dpo-binarized-alpha-french</a><br>
132
  <a href="https://huggingface.co/datasets/PHBJT/cml-tts-20percent-subset">PHBJT/cml-tts-20percent-subset</a><br>
133
  <a href="https://huggingface.co/datasets/Poulpidot/FrenchHateSpeechSuperset">Poulpidot/FrenchHateSpeechSuperset</a><br>
 
134
 
135
  <a href="https://huggingface.co/datasets/qanastek/ECDC">qanastek/ECDC</a><br>
136
 
@@ -146,7 +152,9 @@
146
  <a href="https://huggingface.co/datasets/shuyuej/French-MMLU-Medical-Genetics-Benchmark">shuyuej/French-MMLU-Medical-Genetics-Benchmark</a><br>
147
  <a href="https://huggingface.co/datasets/shuyuej/French-MMLU-Professional-Medicine-Benchmark">shuyuej/French-MMLU-Professional-Medicine-Benchmark</a><br>
148
  <a href="https://huggingface.co/datasets/startlingadama/bambara-french">startlingadama/bambara-french</a><br>
149
-
 
 
150
  <a href="https://huggingface.co/datasets/Tngarg/french_eng">Tngarg/french_eng</a><br>
151
  <a href="https://huggingface.co/datasets/Tngarg/french_english">Tngarg/french_english</a><br>
152
  <a href="https://huggingface.co/datasets/Tngarg/French_of">Tngarg/French_of</a><br>
 
8
  </head>
9
  <body>
10
  <div>
11
+ <h1>Vous trouverez ci-dessous une liste de 140 jeux de données en français mal référencés sur le Hub :<br>
12
  Below is a list of 140 French datasets that are badly referenced on the Hub:</h1>
13
  </div>
14
  <br><br>
 
28
  <a href="https://huggingface.co/datasets/AdrienB134/QA_ASN_test">AdrienB134/QA_ASN_test</a><br>
29
  <a href="https://huggingface.co/datasets/AdrienB134/Small-markdown">AdrienB134/Small-markdown</a><br>
30
  <a href="https://huggingface.co/datasets/ahmadSiddiqi/x-stance_fr">ahmadSiddiqi/x-stance_fr</a><br>
31
+ <a href="https://huggingface.co/datasets/ahazeemi/iwslt14-en-fr">ahazeemi/iwslt14-en-fr</a><br>
32
  <a href="https://huggingface.co/datasets/Alwaly/fr_voxpopuli/">Alwaly/fr_voxpopuli/</a><br>
33
  <a href="https://huggingface.co/datasets/Alwaly/french-Wolof-lang-classification">Alwaly/french-Wolof-lang-classification</a><br>
34
  <a href="https://huggingface.co/datasets/Alwaly/frenchToWolof">Alwaly/frenchToWolof</a><br>
 
41
  <a href="https://huggingface.co/datasets/babs/unlabelled-french-voxpopuli">babs/unlabelled-french-voxpopuli</a><br>
42
  <a href="https://huggingface.co/datasets/BitTranslate/chatgpt-prompts-French">BitTranslate/chatgpt-prompts-French</a><br>
43
  <a href="https://huggingface.co/datasets/bosbos/french_english_instruct">bosbos/french_english_instruct</a><br>
44
+ <a href="https://huggingface.co/datasets/Brendan/nlp244_french_snli">Brendan/nlp244_french_snli</a><br>
45
  <a href="https://huggingface.co/datasets/Databasesprojec/FinStmts_ConsUncons_French_Predict_part1">Databasesprojec/FinStmts_ConsUncons_French_Predict_part1</a><br>
46
  <a href="https://huggingface.co/datasets/Databasesprojec/FinStmts_ConsUncons_French_Predict_part2">Databasesprojec/FinStmts_ConsUncons_French_Predict_part2</a><br>
47
  <a href="https://huggingface.co/datasets/Databasesprojec/FinStmts_ConsUncons_French_SeqClass">Databasesprojec/FinStmts_ConsUncons_French_SeqClass</a><br>
 
86
  <a href="https://huggingface.co/datasets/ismailiismail/French_English_2">ismailiismail/French_English_2</a><br>
87
  <a href="https://huggingface.co/datasets/ismailiismail/FrEn_handpicks">ismailiismail/FrEn_handpicks</a><br>
88
  <a href="https://huggingface.co/datasets/ismailiismail/ner">ismailiismail/ner</a><br>
89
+ <a href="https://huggingface.co/datasets/ismailiismail/multi_paraphrasing_french">ismailiismail/multi_paraphrasing_french</a><br>
90
  <a href="https://huggingface.co/datasets/ismailiismail/paragraphss_paraphrasing">ismailiismail/paragraphss_paraphrasing</a><br>
91
+ <a href="https://huggingface.co/datasets/ismailiismail/paraphrasing_french">ismailiismail/paraphrasing_french</a><br>
92
  <a href="https://huggingface.co/datasets/ismailiismail/paraphrasing_french_5000">ismailiismail/paraphrasing_french_5000</a><br>
93
 
94
  <a href="https://huggingface.co/datasets/jwang214/arc_french/">jwang214/arc_french/</a><br>
 
97
  <a href="https://huggingface.co/datasets/kaitchup/opus-French-to-English">kaitchup/opus-French-to-English</a><br>
98
  <a href="https://huggingface.co/datasets/kloodia/alpaca_french">kloodia/alpaca_french</a><br>
99
 
100
+ <a href="https://huggingface.co/datasets/Makxxx/wikinews">Makxxx/wikinews</a><br>
101
+ <a href="https://huggingface.co/datasets/malteos/french_CEFR">malteos/french_CEFR</a><br>
102
  <a href="https://huggingface.co/datasets/manu/croissant_french_dataset">manu/croissant_french_dataset</a><br>
103
  <a href="https://huggingface.co/datasets/manu/dataset_en_fr">manu/dataset_en_fr</a><br>
104
  <a href="https://huggingface.co/datasets/manu/dataset_en_fr_short">manu/dataset_en_fr_short</a><br>
 
124
  <a href="https://huggingface.co/datasets/Mediform/sharegpt-french">Mediform/sharegpt-french</a><br>
125
  <a href="https://huggingface.co/datasets/musts/french">musts/french</a><br>
126
 
127
+ <a href="https://huggingface.co/datasets/nielsr/datacomp_small_french_captions">nielsr/datacomp_small_french_captions</a><br>
128
  <a href="https://huggingface.co/datasets/nirantk/french-books">nirantk/french-books</a><br>
129
 
130
  <a href="https://huggingface.co/datasets/odunola/french-audio-preprocessed">odunola/french-audio-preprocessed</a><br>
 
136
  <a href="https://huggingface.co/datasets/paulml/chatml-OpenHermes2.5-dpo-binarized-alpha-french">paulml/chatml-OpenHermes2.5-dpo-binarized-alpha-french</a><br>
137
  <a href="https://huggingface.co/datasets/PHBJT/cml-tts-20percent-subset">PHBJT/cml-tts-20percent-subset</a><br>
138
  <a href="https://huggingface.co/datasets/Poulpidot/FrenchHateSpeechSuperset">Poulpidot/FrenchHateSpeechSuperset</a><br>
139
+ <a href="https://huggingface.co/datasets/pvisnrt/french-snli">pvisnrt/french-snli</a><br>
140
 
141
  <a href="https://huggingface.co/datasets/qanastek/ECDC">qanastek/ECDC</a><br>
142
 
 
152
  <a href="https://huggingface.co/datasets/shuyuej/French-MMLU-Medical-Genetics-Benchmark">shuyuej/French-MMLU-Medical-Genetics-Benchmark</a><br>
153
  <a href="https://huggingface.co/datasets/shuyuej/French-MMLU-Professional-Medicine-Benchmark">shuyuej/French-MMLU-Professional-Medicine-Benchmark</a><br>
154
  <a href="https://huggingface.co/datasets/startlingadama/bambara-french">startlingadama/bambara-french</a><br>
155
+ <a href="https://huggingface.co/datasets/sugam11/french-snli">sugam11/french-snli</a><br>
156
+
157
+ <a href="https://huggingface.co/datasets/tbboukhari/Alpaca-in-french">tbboukhari/Alpaca-in-french</a><br>
158
  <a href="https://huggingface.co/datasets/Tngarg/french_eng">Tngarg/french_eng</a><br>
159
  <a href="https://huggingface.co/datasets/Tngarg/french_english">Tngarg/french_english</a><br>
160
  <a href="https://huggingface.co/datasets/Tngarg/French_of">Tngarg/French_of</a><br>