Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
eduagarcia
committed on
Commit
·
395f537
1
Parent(s):
b234783
New model_type: language adapt
Browse files- src/display/about.py +2 -1
- src/display/utils.py +4 -1
src/display/about.py
CHANGED
@@ -63,7 +63,8 @@ Side note on the baseline scores:
|
|
63 |
|
64 |
## Icons
|
65 |
- {ModelType.PT.to_str(" : ")} model: new, base models, trained on a given corpora
|
66 |
-
- {ModelType.
|
|
|
67 |
- {ModelType.chat.to_str(" : ")} model: chat like fine-tunes, either using IFT (datasets of task instruction), RLHF or DPO (changing the model loss a bit with an added policy), etc
|
68 |
- {ModelType.merges.to_str(" : ")} model: merges or MoErges, models which have been merged or fused without additional fine-tuning.
|
69 |
If there is no icon, we have not uploaded the information on the model yet, feel free to open an issue with the model information!
|
|
|
63 |
|
64 |
## Icons
|
65 |
- {ModelType.PT.to_str(" : ")} model: new, base models, trained on a given corpora
|
66 |
+
- {ModelType.LA.to_str(" : ")} model: pretrained models adapted to another language with further-pretraining or finetuning
|
67 |
+
- {ModelType.FT.to_str(" : ")} model: pretrained models finetuned or further-pretrained on more data
|
68 |
- {ModelType.chat.to_str(" : ")} model: chat like fine-tunes, either using IFT (datasets of task instruction), RLHF or DPO (changing the model loss a bit with an added policy), etc
|
69 |
- {ModelType.merges.to_str(" : ")} model: merges or MoErges, models which have been merged or fused without additional fine-tuning.
|
70 |
If there is no icon, we have not uploaded the information on the model yet, feel free to open an issue with the model information!
|
src/display/utils.py
CHANGED
@@ -165,7 +165,8 @@ class ModelDetails:
|
|
165 |
|
166 |
class ModelType(Enum):
|
167 |
PT = ModelDetails(name="pretrained", symbol="🟢")
|
168 |
-
|
|
|
169 |
chat = ModelDetails(name="chat models (RLHF, DPO, IFT, ...)", symbol="💬")
|
170 |
merges = ModelDetails(name="base merges and moerges", symbol="🤝")
|
171 |
Unknown = ModelDetails(name="", symbol="?")
|
@@ -177,6 +178,8 @@ class ModelType(Enum):
|
|
177 |
def from_str(type):
|
178 |
if "fine-tuned" in type or "🔶" in type:
|
179 |
return ModelType.FT
|
|
|
|
|
180 |
if "pretrained" in type or "🟢" in type:
|
181 |
return ModelType.PT
|
182 |
if any([k in type for k in ["instruction-tuned", "RL-tuned", "chat", "🟦", "⭕", "💬"]]):
|
|
|
165 |
|
166 |
class ModelType(Enum):
|
167 |
PT = ModelDetails(name="pretrained", symbol="🟢")
|
168 |
+
LA = ModelDetails(name="language adapted models (FP, FT, ...)", symbol="🆎")
|
169 |
+
FT = ModelDetails(name="fine-tuned/fp on domain-specific datasets", symbol="🔶")
|
170 |
chat = ModelDetails(name="chat models (RLHF, DPO, IFT, ...)", symbol="💬")
|
171 |
merges = ModelDetails(name="base merges and moerges", symbol="🤝")
|
172 |
Unknown = ModelDetails(name="", symbol="?")
|
|
|
178 |
def from_str(type):
|
179 |
if "fine-tuned" in type or "🔶" in type:
|
180 |
return ModelType.FT
|
181 |
+
if "language" in type or "🆎" in type:
|
182 |
+
return ModelType.PT
|
183 |
if "pretrained" in type or "🟢" in type:
|
184 |
return ModelType.PT
|
185 |
if any([k in type for k in ["instruction-tuned", "RL-tuned", "chat", "🟦", "⭕", "💬"]]):
|