Add link to paper, update tags
Browse files
This PR improves the metadata of the model card, and ensures the model is linked to the paper page: https://huggingface.co/papers/2411.13676.
Cheers,
Niels
README.md
CHANGED
@@ -1,4 +1,6 @@
|
|
1 |
---
|
|
|
|
|
2 |
license: other
|
3 |
license_name: nvidia-open-model-license
|
4 |
license_link: https://developer.download.nvidia.com/licenses/nvidia-open-model-license-agreement-june-2024.pdf
|
@@ -142,11 +144,13 @@ Please report security vulnerabilities or NVIDIA AI Concerns [here](https://www.
|
|
142 |
|
143 |
## Citation
|
144 |
```
|
145 |
-
@
|
146 |
-
title={A Hybrid-head Architecture for Small Language Models},
|
147 |
-
author={Xin Dong and Yonggan Fu and Shizhe Diao and Wonmin Byeon and Zijia Chen and Ameya Sunil Mahabaleshwarkar and Shih-Yang Liu and Matthijs Van Keirsbilck and Min-Hung Chen and Yoshi Suhara and Yingyan
|
148 |
-
journal={arXiv preprint arXiv:xxxx},
|
149 |
year={2024},
|
150 |
-
|
|
|
|
|
|
|
151 |
}
|
152 |
```
|
|
|
1 |
---
|
2 |
+
library_name: transformers
|
3 |
+
pipeline_tag: text-generation
|
4 |
license: other
|
5 |
license_name: nvidia-open-model-license
|
6 |
license_link: https://developer.download.nvidia.com/licenses/nvidia-open-model-license-agreement-june-2024.pdf
|
|
|
144 |
|
145 |
## Citation
|
146 |
```
|
147 |
+
@misc{dong2024hymbahybridheadarchitecturesmall,
|
148 |
+
title={Hymba: A Hybrid-head Architecture for Small Language Models},
|
149 |
+
author={Xin Dong and Yonggan Fu and Shizhe Diao and Wonmin Byeon and Zijia Chen and Ameya Sunil Mahabaleshwarkar and Shih-Yang Liu and Matthijs Van Keirsbilck and Min-Hung Chen and Yoshi Suhara and Yingyan Lin and Jan Kautz and Pavlo Molchanov},
|
|
|
150 |
year={2024},
|
151 |
+
eprint={2411.13676},
|
152 |
+
archivePrefix={arXiv},
|
153 |
+
primaryClass={cs.CL},
|
154 |
+
url={https://arxiv.org/abs/2411.13676},
|
155 |
}
|
156 |
```
|