atharvanighot committed on
Commit
de2f903
·
verified ·
1 Parent(s): 2f59b0d

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "atharvanighot/tinyllama-ut",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
 
1
  {
2
+ "_name_or_path": "atharvanighot/tinyllama-pt",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a813fb5a4fbe1a63c83fb5ea91d0496cc0794623820b4a97f11a90a97a84195
3
  size 4811565790
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c704dd7a6380e2bf50aefcecea2db59a8863e761364d59c80eee9053e5dff0ea
3
  size 4811565790
special_tokens_map.json CHANGED
@@ -1,4 +1,11 @@
1
  {
 
 
 
 
 
 
 
2
  "cls_token": {
3
  "content": "[CLS]",
4
  "lstrip": false,
@@ -6,6 +13,13 @@
6
  "rstrip": false,
7
  "single_word": false
8
  },
 
 
 
 
 
 
 
9
  "mask_token": {
10
  "content": "[MASK]",
11
  "lstrip": false,
@@ -28,7 +42,7 @@
28
  "single_word": false
29
  },
30
  "unk_token": {
31
- "content": "[UNK]",
32
  "lstrip": false,
33
  "normalized": false,
34
  "rstrip": false,
 
1
  {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
  "cls_token": {
10
  "content": "[CLS]",
11
  "lstrip": false,
 
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
+ "eos_token": {
17
+ "content": "</s>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
  "mask_token": {
24
  "content": "[MASK]",
25
  "lstrip": false,
 
42
  "single_word": false
43
  },
44
  "unk_token": {
45
+ "content": "<unk>",
46
  "lstrip": false,
47
  "normalized": false,
48
  "rstrip": false,
tokenizer_config.json CHANGED
@@ -65,12 +65,14 @@
65
  "special": true
66
  }
67
  },
 
68
  "clean_up_tokenization_spaces": false,
69
  "cls_token": "[CLS]",
 
70
  "mask_token": "[MASK]",
71
  "model_max_length": 1000000000000000019884624838656,
72
  "pad_token": "[PAD]",
73
  "sep_token": "[SEP]",
74
  "tokenizer_class": "PreTrainedTokenizerFast",
75
- "unk_token": "[UNK]"
76
  }
 
65
  "special": true
66
  }
67
  },
68
+ "bos_token": "<s>",
69
  "clean_up_tokenization_spaces": false,
70
  "cls_token": "[CLS]",
71
+ "eos_token": "</s>",
72
  "mask_token": "[MASK]",
73
  "model_max_length": 1000000000000000019884624838656,
74
  "pad_token": "[PAD]",
75
  "sep_token": "[SEP]",
76
  "tokenizer_class": "PreTrainedTokenizerFast",
77
+ "unk_token": "<unk>"
78
  }