heichow committed on
Commit
74a9036
·
verified ·
1 Parent(s): 05bce46

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,15 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ compiled/014f9e0f66728f19429b.neff filter=lfs diff=lfs merge=lfs -text
37
+ compiled/0cfaffdcfdbd5a217685.neff filter=lfs diff=lfs merge=lfs -text
38
+ compiled/20a998c1e2b2fac0e029.neff filter=lfs diff=lfs merge=lfs -text
39
+ compiled/366225effb325603b39c.neff filter=lfs diff=lfs merge=lfs -text
40
+ compiled/43618e9d5a7af44b2f47.neff filter=lfs diff=lfs merge=lfs -text
41
+ compiled/5ca18545e6b19c345a40.neff filter=lfs diff=lfs merge=lfs -text
42
+ compiled/6a7ed55d61647f668cae.neff filter=lfs diff=lfs merge=lfs -text
43
+ compiled/954e6d9355da77842d33.neff filter=lfs diff=lfs merge=lfs -text
44
+ compiled/9e760b2f376143a0f380.neff filter=lfs diff=lfs merge=lfs -text
45
+ compiled/a0cb8512168ca10205b9.neff filter=lfs diff=lfs merge=lfs -text
46
+ compiled/bc969b06aa6c80aab625.neff filter=lfs diff=lfs merge=lfs -text
47
+ compiled/c6bc2fbdbc03296ac8a5.neff filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: cc-by-sa-4.0
3
+ base_model: meta-llama/Llama-2-7b-hf
4
+ language:
5
+ - yue
6
+ pipeline_tag: text-generation
7
+ tags:
8
+ - cantonese
9
+ - llama-2
10
+ - Powered by AWS Trainium
11
+ ---
12
+
13
+ # Cantonese LLM using Llama-2 7B Architecture
14
+
15
+ Welcome to the preview of the Cantonese Large Language Model (LLM) built on the Llama-2 7B architecture. This model is designed to understand and generate text in Cantonese, including slang, colloquialisms, and Internet terms.
16
+
17
+ ## License
18
+ This project is available under the Creative Commons Attribution-ShareAlike 4.0 International License (CC BY-SA 4.0). For more details, please visit the [license page](https://creativecommons.org/licenses/by-sa/4.0/).
19
+
20
+ ## Preview Warning
21
+ Please be advised that this version of the Cantonese LLM is a **preview**. As such, the model's outputs may sometimes be inaccurate, hallucinated, or potentially offensive to some individuals. We are continuously working to improve the model's accuracy and reduce such instances.
22
+
23
+ ## Training Infrastructure
24
+ The Cantonese LLM was trained using Amazon SageMaker HyperPod and AWS Trainium chips.
25
+
26
+ ## Training Credits
27
+ This model was trained by [Votee AI Limited](https://huggingface.co/votee), a contributor to [hon9kon9ize](https://hon9kon9ize.com/), the Hong Kong AI research community.
28
+
29
+ ## Usage Guidelines
30
+ - Ensure that you are aware of the potential for unexpected or offensive content.
31
+ - Always review and assess the model's output before using it in any application.
32
+ - Provide feedback on any issues you encounter to help us improve the model.
33
+
34
+ ## Contributions
35
+ We welcome contributions from the community. If you have suggestions or improvements, please submit a pull request or open an issue in the project repository.
36
+
37
+ ## Disclaimer
38
+ The developers of the Cantonese LLM are not responsible for any harm or offense caused by the model's outputs. Users are advised to exercise discretion and judgment when using the model.
39
+
40
+ Thank you for exploring the Cantonese LLM. We are excited to see the innovative ways in which it will be used!
compiled/014f9e0f66728f19429b.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02efa6ff620ff3f97bc1723d0992016eba1f1018b0919c1cf6e8c133290d69e5
3
+ size 12452864
compiled/0cfaffdcfdbd5a217685.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fcbc5fc5791df4d19d9547e3eaf6b60f7a3fee0ef494264727f2b88572094a74
3
+ size 21556224
compiled/20a998c1e2b2fac0e029.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6028a12471abd09662eaa30f35be31f3f713722d6976a8353253548e4678a2b5
3
+ size 11203584
compiled/366225effb325603b39c.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8651aa6df6702dcd52dbfd3036c70b14c4b95f1f5cf4a86c18044dfff9a1bb1f
3
+ size 10415104
compiled/43618e9d5a7af44b2f47.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c4830d140e1421d7943f55d974b2a9fd51aa01b4b8df9c68ba488a4b04dc20c
3
+ size 10251264
compiled/5ca18545e6b19c345a40.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:766383b4fd27ceb3cd94c05a2abcb240dcc7b224ca2b2f59ea46a20d689f23a2
3
+ size 12073984
compiled/6a7ed55d61647f668cae.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3d4f58ae1633c4027277dd7a0fff2309b770f6275eab78295e24c839d8db84a
3
+ size 10404864
compiled/954e6d9355da77842d33.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85df1700ded0c026400ccee4c8d6109102bda2f958b4b170ff21080600a55e3c
3
+ size 12657664
compiled/9e760b2f376143a0f380.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8ba49fb1e19c1fcacff2cca4dff9e12140c9a6c72929cead974dca6fc9f9353
3
+ size 10681344
compiled/a0cb8512168ca10205b9.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a3b2415a03dd53c0935cc85c8638ce308411c5c9a91a5cda3bed79e54043e22
3
+ size 12329984
compiled/bc969b06aa6c80aab625.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:630a0f03933dbcf7f962197a6c8641da1059a6e317cd9eb5e4f91149a2e1c0aa
3
+ size 10179584
compiled/c6bc2fbdbc03296ac8a5.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d76f2109261297c222e593e124ce2af9067944f516e74ae801fddfae58219ba
3
+ size 4895744
config.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "meta-llama/Llama-2-7b-hf",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "bos_token_id": 1,
7
+ "eos_token_id": 2,
8
+ "hidden_act": "silu",
9
+ "hidden_size": 4096,
10
+ "initializer_range": 0.02,
11
+ "intermediate_size": 11008,
12
+ "max_position_embeddings": 4096,
13
+ "model_type": "llama",
14
+ "num_attention_heads": 32,
15
+ "num_hidden_layers": 32,
16
+ "num_key_value_heads": 32,
17
+ "pad_token_id": 0,
18
+ "pretraining_tp": 1,
19
+ "rms_norm_eps": 1e-05,
20
+ "rope_scaling": null,
21
+ "tie_word_embeddings": false,
22
+ "torch_dtype": "float16",
23
+ "transformers_version": "4.31.0",
24
+ "use_cache": true,
25
+ "vocab_size": 32000
26
+ }
generation_config.json ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token_id": 1,
3
+ "do_sample": true,
4
+ "eos_token_id": 2,
5
+ "max_length": 4096,
6
+ "max_memory": {
7
+ "cpu": 507036852224
8
+ },
9
+ "no_split_module_classes": [
10
+ "LlamaDecoderLayer"
11
+ ],
12
+ "pad_token_id": 0,
13
+ "special_dtypes": {},
14
+ "temperature": 0.6,
15
+ "top_p": 0.9,
16
+ "transformers_version": "4.31.0"
17
+ }
special_tokens_map.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "</s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "unk_token": {
17
+ "content": "<unk>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ }
23
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347
3
+ size 499723
tokenizer_config.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "__type": "AddedToken",
4
+ "content": "<s>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false
9
+ },
10
+ "clean_up_tokenization_spaces": false,
11
+ "eos_token": {
12
+ "__type": "AddedToken",
13
+ "content": "</s>",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false
18
+ },
19
+ "legacy": false,
20
+ "model_max_length": 1000000000000000019884624838656,
21
+ "pad_token": null,
22
+ "padding_side": "right",
23
+ "sp_model_kwargs": {},
24
+ "tokenizer_class": "LlamaTokenizer",
25
+ "unk_token": {
26
+ "__type": "AddedToken",
27
+ "content": "<unk>",
28
+ "lstrip": false,
29
+ "normalized": false,
30
+ "rstrip": false,
31
+ "single_word": false
32
+ }
33
+ }