bn999 committed on
Commit
8818646
·
verified ·
1 Parent(s): e5421f6

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +0 -94
README.md CHANGED
@@ -4,97 +4,3 @@ base_model: mistralai/Mistral-7B-v0.1
4
  ---
5
 
6
  Selectively pruned and re-trained Mistral-7B for reduced size, targeting only MLP layers.
7
-
8
-
9
- @misc{open-llm-leaderboard,
10
- author = {Edward Beeching and Clémentine Fourrier and Nathan Habib and Sheon Han and Nathan Lambert and Nazneen Rajani and Omar Sanseviero and Lewis Tunstall and Thomas Wolf},
11
- title = {Open LLM Leaderboard},
12
- year = {2023},
13
- publisher = {Hugging Face},
14
- howpublished = "\url{https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard}"
15
- }
16
- @software{eval-harness,
17
- author = {Gao, Leo and
18
- Tow, Jonathan and
19
- Biderman, Stella and
20
- Black, Sid and
21
- DiPofi, Anthony and
22
- Foster, Charles and
23
- Golding, Laurence and
24
- Hsu, Jeffrey and
25
- McDonell, Kyle and
26
- Muennighoff, Niklas and
27
- Phang, Jason and
28
- Reynolds, Laria and
29
- Tang, Eric and
30
- Thite, Anish and
31
- Wang, Ben and
32
- Wang, Kevin and
33
- Zou, Andy},
34
- title = {A framework for few-shot language model evaluation},
35
- month = sep,
36
- year = 2021,
37
- publisher = {Zenodo},
38
- version = {v0.0.1},
39
- doi = {10.5281/zenodo.5371628},
40
- url = {https://doi.org/10.5281/zenodo.5371628}
41
- }
42
- @misc{clark2018think,
43
- title={Think you have Solved Question Answering? Try ARC, the AI2 Reasoning Challenge},
44
- author={Peter Clark and Isaac Cowhey and Oren Etzioni and Tushar Khot and Ashish Sabharwal and Carissa Schoenick and Oyvind Tafjord},
45
- year={2018},
46
- eprint={1803.05457},
47
- archivePrefix={arXiv},
48
- primaryClass={cs.AI}
49
- }
50
- @misc{zellers2019hellaswag,
51
- title={HellaSwag: Can a Machine Really Finish Your Sentence?},
52
- author={Rowan Zellers and Ari Holtzman and Yonatan Bisk and Ali Farhadi and Yejin Choi},
53
- year={2019},
54
- eprint={1905.07830},
55
- archivePrefix={arXiv},
56
- primaryClass={cs.CL}
57
- }
58
- @misc{hendrycks2021measuring,
59
- title={Measuring Massive Multitask Language Understanding},
60
- author={Dan Hendrycks and Collin Burns and Steven Basart and Andy Zou and Mantas Mazeika and Dawn Song and Jacob Steinhardt},
61
- year={2021},
62
- eprint={2009.03300},
63
- archivePrefix={arXiv},
64
- primaryClass={cs.CY}
65
- }
66
- @misc{lin2022truthfulqa,
67
- title={TruthfulQA: Measuring How Models Mimic Human Falsehoods},
68
- author={Stephanie Lin and Jacob Hilton and Owain Evans},
69
- year={2022},
70
- eprint={2109.07958},
71
- archivePrefix={arXiv},
72
- primaryClass={cs.CL}
73
- }
74
- @misc{DBLP:journals/corr/abs-1907-10641,
75
- title={{WINOGRANDE:} An Adversarial Winograd Schema Challenge at Scale},
76
- author={Keisuke Sakaguchi and Ronan Le Bras and Chandra Bhagavatula and Yejin Choi},
77
- year={2019},
78
- eprint={1907.10641},
79
- archivePrefix={arXiv},
80
- primaryClass={cs.CL}
81
- }
82
- @misc{DBLP:journals/corr/abs-2110-14168,
83
- title={Training Verifiers to Solve Math Word Problems},
84
- author={Karl Cobbe and
85
- Vineet Kosaraju and
86
- Mohammad Bavarian and
87
- Mark Chen and
88
- Heewoo Jun and
89
- Lukasz Kaiser and
90
- Matthias Plappert and
91
- Jerry Tworek and
92
- Jacob Hilton and
93
- Reiichiro Nakano and
94
- Christopher Hesse and
95
- John Schulman},
96
- year={2021},
97
- eprint={2110.14168},
98
- archivePrefix={arXiv},
99
- primaryClass={cs.CL}
100
- }
 
4
  ---
5
 
6
  Selectively pruned and re-trained Mistral-7B for reduced size, targeting only MLP layers.