Training in progress, step 100
Browse files- added_tokens.json +31 -40
- config.json +2 -2
- model.safetensors +2 -2
- preprocessor_config.json +1 -1
- runs/Nov03_15-28-31_12e2880e4751/events.out.tfevents.1730647765.12e2880e4751.1950.0 +3 -0
- special_tokens_map.json +4 -28
- tokenizer_config.json +30 -126
- training_args.bin +1 -1
added_tokens.json
CHANGED
@@ -1,43 +1,34 @@
|
|
1 |
{
|
2 |
-
" ":
|
3 |
"<pad>": 86,
|
4 |
-
"
|
5 |
-
"
|
6 |
-
"
|
7 |
-
"
|
8 |
-
"
|
9 |
-
"
|
10 |
-
"
|
11 |
-
"
|
12 |
-
"
|
13 |
-
"
|
14 |
-
"
|
15 |
-
"
|
16 |
-
"
|
17 |
-
"
|
18 |
-
"
|
19 |
-
"
|
20 |
-
"
|
21 |
-
"
|
22 |
-
"
|
23 |
-
"
|
24 |
-
"
|
25 |
-
"
|
26 |
-
"
|
27 |
-
"
|
28 |
-
"
|
29 |
-
"
|
30 |
-
"
|
31 |
-
"
|
32 |
-
"
|
33 |
-
"
|
34 |
-
"۔": 91,
|
35 |
-
"۽": 113,
|
36 |
-
"۾": 118,
|
37 |
-
"": 94,
|
38 |
-
"–": 124,
|
39 |
-
"—": 106,
|
40 |
-
"‘": 102,
|
41 |
-
"’": 119,
|
42 |
-
"”": 92
|
43 |
}
|
|
|
1 |
{
|
2 |
+
" ": 101,
|
3 |
"<pad>": 86,
|
4 |
+
"é": 95,
|
5 |
+
"ٺ": 91,
|
6 |
+
"ٻ": 99,
|
7 |
+
"ٽ": 87,
|
8 |
+
"پ": 96,
|
9 |
+
"ٿ": 103,
|
10 |
+
"ڀ": 109,
|
11 |
+
"ڃ": 98,
|
12 |
+
"ڄ": 90,
|
13 |
+
"ڇ": 106,
|
14 |
+
"ڊ": 110,
|
15 |
+
"ڌ": 116,
|
16 |
+
"ڍ": 102,
|
17 |
+
"ڏ": 92,
|
18 |
+
"ڙ": 105,
|
19 |
+
"ڦ": 112,
|
20 |
+
"ڪ": 115,
|
21 |
+
"ڱ": 104,
|
22 |
+
"ڳ": 89,
|
23 |
+
"ں": 111,
|
24 |
+
"ڻ": 94,
|
25 |
+
"ھ": 97,
|
26 |
+
"ہ": 108,
|
27 |
+
"۽": 107,
|
28 |
+
"۾": 117,
|
29 |
+
"–": 113,
|
30 |
+
"—": 100,
|
31 |
+
"‘": 93,
|
32 |
+
"’": 114,
|
33 |
+
"”": 88
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
34 |
}
|
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "
|
3 |
"activation_dropout": 0.1,
|
4 |
"apply_spec_augment": true,
|
5 |
"architectures": [
|
@@ -88,5 +88,5 @@
|
|
88 |
"transformers_version": "4.44.2",
|
89 |
"use_cache": false,
|
90 |
"use_guided_attention_loss": true,
|
91 |
-
"vocab_size":
|
92 |
}
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "MBZUAI/speecht5_tts_clartts_ar",
|
3 |
"activation_dropout": 0.1,
|
4 |
"apply_spec_augment": true,
|
5 |
"architectures": [
|
|
|
88 |
"transformers_version": "4.44.2",
|
89 |
"use_cache": false,
|
90 |
"use_guided_attention_loss": true,
|
91 |
+
"vocab_size": 118
|
92 |
}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:671e9df12175ed01ae1996a657fe418518cc2125f88bb029635640627b0f2ef2
|
3 |
+
size 577902984
|
preprocessor_config.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
"do_normalize": false,
|
3 |
"feature_extractor_type": "SpeechT5FeatureExtractor",
|
4 |
-
"feature_size":
|
5 |
"fmax": 7600,
|
6 |
"fmin": 80,
|
7 |
"frame_signal_scale": 1.0,
|
|
|
1 |
{
|
2 |
"do_normalize": false,
|
3 |
"feature_extractor_type": "SpeechT5FeatureExtractor",
|
4 |
+
"feature_size": 1,
|
5 |
"fmax": 7600,
|
6 |
"fmin": 80,
|
7 |
"frame_signal_scale": 1.0,
|
runs/Nov03_15-28-31_12e2880e4751/events.out.tfevents.1730647765.12e2880e4751.1950.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5332658b8c82a689f8c17d060fd611390c30344fc3057c42c606393a438ab314
|
3 |
+
size 7636
|
special_tokens_map.json
CHANGED
@@ -1,30 +1,6 @@
|
|
1 |
{
|
2 |
-
"bos_token":
|
3 |
-
|
4 |
-
|
5 |
-
|
6 |
-
"rstrip": false,
|
7 |
-
"single_word": false
|
8 |
-
},
|
9 |
-
"eos_token": {
|
10 |
-
"content": "</s>",
|
11 |
-
"lstrip": false,
|
12 |
-
"normalized": false,
|
13 |
-
"rstrip": false,
|
14 |
-
"single_word": false
|
15 |
-
},
|
16 |
-
"pad_token": {
|
17 |
-
"content": "<pad>",
|
18 |
-
"lstrip": false,
|
19 |
-
"normalized": false,
|
20 |
-
"rstrip": false,
|
21 |
-
"single_word": false
|
22 |
-
},
|
23 |
-
"unk_token": {
|
24 |
-
"content": "<unk>",
|
25 |
-
"lstrip": false,
|
26 |
-
"normalized": false,
|
27 |
-
"rstrip": false,
|
28 |
-
"single_word": false
|
29 |
-
}
|
30 |
}
|
|
|
1 |
{
|
2 |
+
"bos_token": "<s>",
|
3 |
+
"eos_token": "</s>",
|
4 |
+
"pad_token": "<pad>",
|
5 |
+
"unk_token": "<unk>"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
6 |
}
|
tokenizer_config.json
CHANGED
@@ -272,14 +272,6 @@
|
|
272 |
"single_word": false,
|
273 |
"special": false
|
274 |
},
|
275 |
-
"39": {
|
276 |
-
"content": "ؤ",
|
277 |
-
"lstrip": false,
|
278 |
-
"normalized": true,
|
279 |
-
"rstrip": false,
|
280 |
-
"single_word": false,
|
281 |
-
"special": false
|
282 |
-
},
|
283 |
"40": {
|
284 |
"content": "0",
|
285 |
"lstrip": false,
|
@@ -552,14 +544,6 @@
|
|
552 |
"single_word": false,
|
553 |
"special": false
|
554 |
},
|
555 |
-
"77": {
|
556 |
-
"content": "j",
|
557 |
-
"lstrip": false,
|
558 |
-
"normalized": true,
|
559 |
-
"rstrip": false,
|
560 |
-
"single_word": false,
|
561 |
-
"special": false
|
562 |
-
},
|
563 |
"78": {
|
564 |
"content": "z",
|
565 |
"lstrip": false,
|
@@ -592,14 +576,6 @@
|
|
592 |
"single_word": false,
|
593 |
"special": false
|
594 |
},
|
595 |
-
"82": {
|
596 |
-
"content": "q",
|
597 |
-
"lstrip": false,
|
598 |
-
"normalized": true,
|
599 |
-
"rstrip": false,
|
600 |
-
"single_word": false,
|
601 |
-
"special": false
|
602 |
-
},
|
603 |
"85": {
|
604 |
"content": "چ",
|
605 |
"lstrip": false,
|
@@ -617,7 +593,7 @@
|
|
617 |
"special": true
|
618 |
},
|
619 |
"87": {
|
620 |
-
"content": "
|
621 |
"lstrip": false,
|
622 |
"normalized": true,
|
623 |
"rstrip": false,
|
@@ -625,7 +601,7 @@
|
|
625 |
"special": false
|
626 |
},
|
627 |
"88": {
|
628 |
-
"content": "
|
629 |
"lstrip": false,
|
630 |
"normalized": true,
|
631 |
"rstrip": false,
|
@@ -633,7 +609,7 @@
|
|
633 |
"special": false
|
634 |
},
|
635 |
"89": {
|
636 |
-
"content": "
|
637 |
"lstrip": false,
|
638 |
"normalized": true,
|
639 |
"rstrip": false,
|
@@ -641,7 +617,7 @@
|
|
641 |
"special": false
|
642 |
},
|
643 |
"90": {
|
644 |
-
"content": "
|
645 |
"lstrip": false,
|
646 |
"normalized": true,
|
647 |
"rstrip": false,
|
@@ -649,7 +625,7 @@
|
|
649 |
"special": false
|
650 |
},
|
651 |
"91": {
|
652 |
-
"content": "
|
653 |
"lstrip": false,
|
654 |
"normalized": true,
|
655 |
"rstrip": false,
|
@@ -657,7 +633,7 @@
|
|
657 |
"special": false
|
658 |
},
|
659 |
"92": {
|
660 |
-
"content": "
|
661 |
"lstrip": false,
|
662 |
"normalized": true,
|
663 |
"rstrip": false,
|
@@ -665,7 +641,7 @@
|
|
665 |
"special": false
|
666 |
},
|
667 |
"93": {
|
668 |
-
"content": "
|
669 |
"lstrip": false,
|
670 |
"normalized": true,
|
671 |
"rstrip": false,
|
@@ -673,7 +649,7 @@
|
|
673 |
"special": false
|
674 |
},
|
675 |
"94": {
|
676 |
-
"content": "
|
677 |
"lstrip": false,
|
678 |
"normalized": true,
|
679 |
"rstrip": false,
|
@@ -681,7 +657,7 @@
|
|
681 |
"special": false
|
682 |
},
|
683 |
"95": {
|
684 |
-
"content": "
|
685 |
"lstrip": false,
|
686 |
"normalized": true,
|
687 |
"rstrip": false,
|
@@ -689,7 +665,7 @@
|
|
689 |
"special": false
|
690 |
},
|
691 |
"96": {
|
692 |
-
"content": "
|
693 |
"lstrip": false,
|
694 |
"normalized": true,
|
695 |
"rstrip": false,
|
@@ -697,7 +673,7 @@
|
|
697 |
"special": false
|
698 |
},
|
699 |
"97": {
|
700 |
-
"content": "
|
701 |
"lstrip": false,
|
702 |
"normalized": true,
|
703 |
"rstrip": false,
|
@@ -705,7 +681,7 @@
|
|
705 |
"special": false
|
706 |
},
|
707 |
"98": {
|
708 |
-
"content": "
|
709 |
"lstrip": false,
|
710 |
"normalized": true,
|
711 |
"rstrip": false,
|
@@ -713,7 +689,7 @@
|
|
713 |
"special": false
|
714 |
},
|
715 |
"99": {
|
716 |
-
"content": "
|
717 |
"lstrip": false,
|
718 |
"normalized": true,
|
719 |
"rstrip": false,
|
@@ -721,7 +697,7 @@
|
|
721 |
"special": false
|
722 |
},
|
723 |
"100": {
|
724 |
-
"content": "
|
725 |
"lstrip": false,
|
726 |
"normalized": true,
|
727 |
"rstrip": false,
|
@@ -729,7 +705,7 @@
|
|
729 |
"special": false
|
730 |
},
|
731 |
"101": {
|
732 |
-
"content": "
|
733 |
"lstrip": false,
|
734 |
"normalized": true,
|
735 |
"rstrip": false,
|
@@ -737,7 +713,7 @@
|
|
737 |
"special": false
|
738 |
},
|
739 |
"102": {
|
740 |
-
"content": "
|
741 |
"lstrip": false,
|
742 |
"normalized": true,
|
743 |
"rstrip": false,
|
@@ -745,7 +721,7 @@
|
|
745 |
"special": false
|
746 |
},
|
747 |
"103": {
|
748 |
-
"content": "
|
749 |
"lstrip": false,
|
750 |
"normalized": true,
|
751 |
"rstrip": false,
|
@@ -753,7 +729,7 @@
|
|
753 |
"special": false
|
754 |
},
|
755 |
"104": {
|
756 |
-
"content": "
|
757 |
"lstrip": false,
|
758 |
"normalized": true,
|
759 |
"rstrip": false,
|
@@ -761,7 +737,7 @@
|
|
761 |
"special": false
|
762 |
},
|
763 |
"105": {
|
764 |
-
"content": "
|
765 |
"lstrip": false,
|
766 |
"normalized": true,
|
767 |
"rstrip": false,
|
@@ -769,7 +745,7 @@
|
|
769 |
"special": false
|
770 |
},
|
771 |
"106": {
|
772 |
-
"content": "
|
773 |
"lstrip": false,
|
774 |
"normalized": true,
|
775 |
"rstrip": false,
|
@@ -777,7 +753,7 @@
|
|
777 |
"special": false
|
778 |
},
|
779 |
"107": {
|
780 |
-
"content": "
|
781 |
"lstrip": false,
|
782 |
"normalized": true,
|
783 |
"rstrip": false,
|
@@ -785,7 +761,7 @@
|
|
785 |
"special": false
|
786 |
},
|
787 |
"108": {
|
788 |
-
"content": "
|
789 |
"lstrip": false,
|
790 |
"normalized": true,
|
791 |
"rstrip": false,
|
@@ -793,7 +769,7 @@
|
|
793 |
"special": false
|
794 |
},
|
795 |
"109": {
|
796 |
-
"content": "
|
797 |
"lstrip": false,
|
798 |
"normalized": true,
|
799 |
"rstrip": false,
|
@@ -801,7 +777,7 @@
|
|
801 |
"special": false
|
802 |
},
|
803 |
"110": {
|
804 |
-
"content": "
|
805 |
"lstrip": false,
|
806 |
"normalized": true,
|
807 |
"rstrip": false,
|
@@ -809,7 +785,7 @@
|
|
809 |
"special": false
|
810 |
},
|
811 |
"111": {
|
812 |
-
"content": "
|
813 |
"lstrip": false,
|
814 |
"normalized": true,
|
815 |
"rstrip": false,
|
@@ -817,7 +793,7 @@
|
|
817 |
"special": false
|
818 |
},
|
819 |
"112": {
|
820 |
-
"content": "
|
821 |
"lstrip": false,
|
822 |
"normalized": true,
|
823 |
"rstrip": false,
|
@@ -825,7 +801,7 @@
|
|
825 |
"special": false
|
826 |
},
|
827 |
"113": {
|
828 |
-
"content": "
|
829 |
"lstrip": false,
|
830 |
"normalized": true,
|
831 |
"rstrip": false,
|
@@ -833,7 +809,7 @@
|
|
833 |
"special": false
|
834 |
},
|
835 |
"114": {
|
836 |
-
"content": "
|
837 |
"lstrip": false,
|
838 |
"normalized": true,
|
839 |
"rstrip": false,
|
@@ -841,7 +817,7 @@
|
|
841 |
"special": false
|
842 |
},
|
843 |
"115": {
|
844 |
-
"content": "
|
845 |
"lstrip": false,
|
846 |
"normalized": true,
|
847 |
"rstrip": false,
|
@@ -849,7 +825,7 @@
|
|
849 |
"special": false
|
850 |
},
|
851 |
"116": {
|
852 |
-
"content": "
|
853 |
"lstrip": false,
|
854 |
"normalized": true,
|
855 |
"rstrip": false,
|
@@ -857,84 +833,12 @@
|
|
857 |
"special": false
|
858 |
},
|
859 |
"117": {
|
860 |
-
"content": "ڻ",
|
861 |
-
"lstrip": false,
|
862 |
-
"normalized": true,
|
863 |
-
"rstrip": false,
|
864 |
-
"single_word": false,
|
865 |
-
"special": false
|
866 |
-
},
|
867 |
-
"118": {
|
868 |
"content": "۾",
|
869 |
"lstrip": false,
|
870 |
"normalized": true,
|
871 |
"rstrip": false,
|
872 |
"single_word": false,
|
873 |
"special": false
|
874 |
-
},
|
875 |
-
"119": {
|
876 |
-
"content": "’",
|
877 |
-
"lstrip": false,
|
878 |
-
"normalized": true,
|
879 |
-
"rstrip": false,
|
880 |
-
"single_word": false,
|
881 |
-
"special": false
|
882 |
-
},
|
883 |
-
"120": {
|
884 |
-
"content": "ڳ",
|
885 |
-
"lstrip": false,
|
886 |
-
"normalized": true,
|
887 |
-
"rstrip": false,
|
888 |
-
"single_word": false,
|
889 |
-
"special": false
|
890 |
-
},
|
891 |
-
"121": {
|
892 |
-
"content": "ڌ",
|
893 |
-
"lstrip": false,
|
894 |
-
"normalized": true,
|
895 |
-
"rstrip": false,
|
896 |
-
"single_word": false,
|
897 |
-
"special": false
|
898 |
-
},
|
899 |
-
"122": {
|
900 |
-
"content": "ٻ",
|
901 |
-
"lstrip": false,
|
902 |
-
"normalized": true,
|
903 |
-
"rstrip": false,
|
904 |
-
"single_word": false,
|
905 |
-
"special": false
|
906 |
-
},
|
907 |
-
"123": {
|
908 |
-
"content": "½",
|
909 |
-
"lstrip": false,
|
910 |
-
"normalized": true,
|
911 |
-
"rstrip": false,
|
912 |
-
"single_word": false,
|
913 |
-
"special": false
|
914 |
-
},
|
915 |
-
"124": {
|
916 |
-
"content": "–",
|
917 |
-
"lstrip": false,
|
918 |
-
"normalized": true,
|
919 |
-
"rstrip": false,
|
920 |
-
"single_word": false,
|
921 |
-
"special": false
|
922 |
-
},
|
923 |
-
"125": {
|
924 |
-
"content": "ڃ",
|
925 |
-
"lstrip": false,
|
926 |
-
"normalized": true,
|
927 |
-
"rstrip": false,
|
928 |
-
"single_word": false,
|
929 |
-
"special": false
|
930 |
-
},
|
931 |
-
"126": {
|
932 |
-
"content": "°",
|
933 |
-
"lstrip": false,
|
934 |
-
"normalized": true,
|
935 |
-
"rstrip": false,
|
936 |
-
"single_word": false,
|
937 |
-
"special": false
|
938 |
}
|
939 |
},
|
940 |
"bos_token": "<s>",
|
|
|
272 |
"single_word": false,
|
273 |
"special": false
|
274 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
275 |
"40": {
|
276 |
"content": "0",
|
277 |
"lstrip": false,
|
|
|
544 |
"single_word": false,
|
545 |
"special": false
|
546 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
547 |
"78": {
|
548 |
"content": "z",
|
549 |
"lstrip": false,
|
|
|
576 |
"single_word": false,
|
577 |
"special": false
|
578 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
579 |
"85": {
|
580 |
"content": "چ",
|
581 |
"lstrip": false,
|
|
|
593 |
"special": true
|
594 |
},
|
595 |
"87": {
|
596 |
+
"content": "ٽ",
|
597 |
"lstrip": false,
|
598 |
"normalized": true,
|
599 |
"rstrip": false,
|
|
|
601 |
"special": false
|
602 |
},
|
603 |
"88": {
|
604 |
+
"content": "”",
|
605 |
"lstrip": false,
|
606 |
"normalized": true,
|
607 |
"rstrip": false,
|
|
|
609 |
"special": false
|
610 |
},
|
611 |
"89": {
|
612 |
+
"content": "ڳ",
|
613 |
"lstrip": false,
|
614 |
"normalized": true,
|
615 |
"rstrip": false,
|
|
|
617 |
"special": false
|
618 |
},
|
619 |
"90": {
|
620 |
+
"content": "ڄ",
|
621 |
"lstrip": false,
|
622 |
"normalized": true,
|
623 |
"rstrip": false,
|
|
|
625 |
"special": false
|
626 |
},
|
627 |
"91": {
|
628 |
+
"content": "ٺ",
|
629 |
"lstrip": false,
|
630 |
"normalized": true,
|
631 |
"rstrip": false,
|
|
|
633 |
"special": false
|
634 |
},
|
635 |
"92": {
|
636 |
+
"content": "ڏ",
|
637 |
"lstrip": false,
|
638 |
"normalized": true,
|
639 |
"rstrip": false,
|
|
|
641 |
"special": false
|
642 |
},
|
643 |
"93": {
|
644 |
+
"content": "‘",
|
645 |
"lstrip": false,
|
646 |
"normalized": true,
|
647 |
"rstrip": false,
|
|
|
649 |
"special": false
|
650 |
},
|
651 |
"94": {
|
652 |
+
"content": "ڻ",
|
653 |
"lstrip": false,
|
654 |
"normalized": true,
|
655 |
"rstrip": false,
|
|
|
657 |
"special": false
|
658 |
},
|
659 |
"95": {
|
660 |
+
"content": "é",
|
661 |
"lstrip": false,
|
662 |
"normalized": true,
|
663 |
"rstrip": false,
|
|
|
665 |
"special": false
|
666 |
},
|
667 |
"96": {
|
668 |
+
"content": "پ",
|
669 |
"lstrip": false,
|
670 |
"normalized": true,
|
671 |
"rstrip": false,
|
|
|
673 |
"special": false
|
674 |
},
|
675 |
"97": {
|
676 |
+
"content": "ھ",
|
677 |
"lstrip": false,
|
678 |
"normalized": true,
|
679 |
"rstrip": false,
|
|
|
681 |
"special": false
|
682 |
},
|
683 |
"98": {
|
684 |
+
"content": "ڃ",
|
685 |
"lstrip": false,
|
686 |
"normalized": true,
|
687 |
"rstrip": false,
|
|
|
689 |
"special": false
|
690 |
},
|
691 |
"99": {
|
692 |
+
"content": "ٻ",
|
693 |
"lstrip": false,
|
694 |
"normalized": true,
|
695 |
"rstrip": false,
|
|
|
697 |
"special": false
|
698 |
},
|
699 |
"100": {
|
700 |
+
"content": "—",
|
701 |
"lstrip": false,
|
702 |
"normalized": true,
|
703 |
"rstrip": false,
|
|
|
705 |
"special": false
|
706 |
},
|
707 |
"101": {
|
708 |
+
"content": " ",
|
709 |
"lstrip": false,
|
710 |
"normalized": true,
|
711 |
"rstrip": false,
|
|
|
713 |
"special": false
|
714 |
},
|
715 |
"102": {
|
716 |
+
"content": "ڍ",
|
717 |
"lstrip": false,
|
718 |
"normalized": true,
|
719 |
"rstrip": false,
|
|
|
721 |
"special": false
|
722 |
},
|
723 |
"103": {
|
724 |
+
"content": "ٿ",
|
725 |
"lstrip": false,
|
726 |
"normalized": true,
|
727 |
"rstrip": false,
|
|
|
729 |
"special": false
|
730 |
},
|
731 |
"104": {
|
732 |
+
"content": "ڱ",
|
733 |
"lstrip": false,
|
734 |
"normalized": true,
|
735 |
"rstrip": false,
|
|
|
737 |
"special": false
|
738 |
},
|
739 |
"105": {
|
740 |
+
"content": "ڙ",
|
741 |
"lstrip": false,
|
742 |
"normalized": true,
|
743 |
"rstrip": false,
|
|
|
745 |
"special": false
|
746 |
},
|
747 |
"106": {
|
748 |
+
"content": "ڇ",
|
749 |
"lstrip": false,
|
750 |
"normalized": true,
|
751 |
"rstrip": false,
|
|
|
753 |
"special": false
|
754 |
},
|
755 |
"107": {
|
756 |
+
"content": "۽",
|
757 |
"lstrip": false,
|
758 |
"normalized": true,
|
759 |
"rstrip": false,
|
|
|
761 |
"special": false
|
762 |
},
|
763 |
"108": {
|
764 |
+
"content": "ہ",
|
765 |
"lstrip": false,
|
766 |
"normalized": true,
|
767 |
"rstrip": false,
|
|
|
769 |
"special": false
|
770 |
},
|
771 |
"109": {
|
772 |
+
"content": "ڀ",
|
773 |
"lstrip": false,
|
774 |
"normalized": true,
|
775 |
"rstrip": false,
|
|
|
777 |
"special": false
|
778 |
},
|
779 |
"110": {
|
780 |
+
"content": "ڊ",
|
781 |
"lstrip": false,
|
782 |
"normalized": true,
|
783 |
"rstrip": false,
|
|
|
785 |
"special": false
|
786 |
},
|
787 |
"111": {
|
788 |
+
"content": "ں",
|
789 |
"lstrip": false,
|
790 |
"normalized": true,
|
791 |
"rstrip": false,
|
|
|
793 |
"special": false
|
794 |
},
|
795 |
"112": {
|
796 |
+
"content": "ڦ",
|
797 |
"lstrip": false,
|
798 |
"normalized": true,
|
799 |
"rstrip": false,
|
|
|
801 |
"special": false
|
802 |
},
|
803 |
"113": {
|
804 |
+
"content": "–",
|
805 |
"lstrip": false,
|
806 |
"normalized": true,
|
807 |
"rstrip": false,
|
|
|
809 |
"special": false
|
810 |
},
|
811 |
"114": {
|
812 |
+
"content": "’",
|
813 |
"lstrip": false,
|
814 |
"normalized": true,
|
815 |
"rstrip": false,
|
|
|
817 |
"special": false
|
818 |
},
|
819 |
"115": {
|
820 |
+
"content": "ڪ",
|
821 |
"lstrip": false,
|
822 |
"normalized": true,
|
823 |
"rstrip": false,
|
|
|
825 |
"special": false
|
826 |
},
|
827 |
"116": {
|
828 |
+
"content": "ڌ",
|
829 |
"lstrip": false,
|
830 |
"normalized": true,
|
831 |
"rstrip": false,
|
|
|
833 |
"special": false
|
834 |
},
|
835 |
"117": {
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
836 |
"content": "۾",
|
837 |
"lstrip": false,
|
838 |
"normalized": true,
|
839 |
"rstrip": false,
|
840 |
"single_word": false,
|
841 |
"special": false
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
842 |
}
|
843 |
},
|
844 |
"bos_token": "<s>",
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5368
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34ab21a90b32e29a6842c6e7e298a8a66827aa2bc93228f3cc8f403719f81262
|
3 |
size 5368
|