Upload folder using huggingface_hub

Browse files

Files changed (8) hide show

config.json +128 -0
info.log +0 -0
labels.vocab +60 -0
pytorch_model.bin +3 -0
tokenizer/special_tokens_map.json +1 -0
tokenizer/tokenizer_config.json +1 -0
tokenizer/vocab.txt +0 -0
transformer.json +21 -0

config.json ADDED Viewed

	@@ -0,0 +1,128 @@

+{
+    "experiment": "ota_boun",
+    "name": "bert-base-turkish-cased",
+    "n_gpu": 1,
+    "model": {
+        "type": "MultiParser",
+        "args": {
+            "embeddings_processor": {
+                "type": "BertWrapper",
+                "args": {
+                    "model_path": "data/pretrained_embeddings/bert-base-turkish-cased-nonpretrained",
+                    "fine_tune": true,
+                    "hidden_dropout": 0.2,
+                    "attn_dropout": 0.2,
+                    "output_dropout": 0.5,
+                    "scalar_mix_layer_dropout": 0.1,
+                    "token_mask_prob": 0.15
+                }
+            },
+            "outputs": {
+                "heads": {
+                    "type": "ArcScorer",
+                    "args": {
+                        "scorer_class": "DeepBiaffineScorer",
+                        "head_mode": "single_head",
+                        "hidden_size": 768,
+                        "dropout": 0.33,
+                        "vocab": {
+                            "type": "IntegerVocab"
+                        }
+                    }
+                },
+                "labels": {
+                    "type": "DependencyClassifier",
+                    "args": {
+                        "scorer_class": "DeepBiaffineScorer",
+                        "hidden_size": 256,
+                        "dropout": 0.33,
+                        "vocab": {
+                            "type": "BasicVocab",
+                            "args": {
+                                "vocab_filename": "data/corpora/ota_boun/vocab/basic.vocab"
+                            }
+                        }
+                    }
+                }
+            },
+            "post_processors": [
+                {
+                    "type": "FactorizedMSTPostProcessor",
+                    "args": {
+                        "annotation_ids": [
+                            "heads",
+                            "labels"
+                        ]
+                    }
+                }
+            ]
+        }
+    },
+    "data_loaders": {
+        "type": "BucketedCONLLLoader",
+        "args": {
+            "annotation_layers": {
+                "heads": {
+                    "type": "TagSequence",
+                    "source_column": 6,
+                    "args": {
+                        "ignore_root": true
+                    }
+                },
+                "labels": {
+                    "type": "DependencyMatrix",
+                    "source_column": [
+                        6,
+                        7
+                    ],
+                    "args": {
+                        "ignore_non_relations": true
+                    }
+                }
+            },
+            "batch_size": 32,
+            "bucket_size": 256,
+            "max_tokens_per_batch": 156800,
+            "num_workers": 2
+        },
+        "paths": {
+            "train": "data/corpora/ota_boun/ota_boun-ud-train.conllu",
+            "dev": "data/corpora/ota_boun/ota_boun-ud-test.conllu",
+            "test": "data/corpora/ota_boun/tr_boun-ud-test.conllu"
+        }
+    },
+    "trainer": {
+        "min_epochs": 15,
+        "max_epochs": 300,
+        "early_stop": 15,
+        "save_dir": "data/saved_models/",
+        "save_period": 20,
+        "verbosity": 2,
+        "validation_criterion": {
+            "metrics": {
+                "heads": "fscore",
+                "labels": "fscore"
+            },
+            "weighting": "multiplicative"
+        },
+        "optimizer": {
+            "type": "AdamW",
+            "args": {
+                "lr": 4e-05,
+                "weight_decay": 0.0
+            }
+        },
+        "lr_scheduler": {
+            "type": "LambdaLR",
+            "args": {
+                "lr_lambda": "SqrtSchedule(400)"
+            }
+        },
+        "loss": {
+            "type": "CrossEntropyLoss",
+            "args": {
+                "ignore_index": -1
+            }
+        }
+    }
+}

info.log ADDED Viewed

The diff for this file is too large to render. See raw diff

labels.vocab ADDED Viewed

	@@ -0,0 +1,60 @@

+root
+case
+det
+obl
+nsubj
+punct
+flat
+obj
+advcl
+nummod
+mark
+amod
+nmod
+compound
+advmod
+nsubj:pass
+aux
+aux:pass
+acl
+conj
+obl:tmod
+cc
+det:predet
+cop
+nmod:poss
+ccomp
+parataxis
+expl
+flat:foreign
+xcomp
+csubj
+fixed
+acl:relcl
+appos
+compound:prt
+iobj
+nmod:tmod
+obl:npmod
+cc:preconj
+reparandum
+vocative
+discourse
+goeswith
+list
+nmod:npmod
+orphan
+dep
+csubj:pass
+dislocated
+compound:lvc
+advmod:emph
+obl:agent
+compound:redup
+aux:q
+clf
+csubj:outer
+dep:der
+discourse:q
+nmod:part
+nsubj:outer

pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8e1c1cd47eff0dc4b0698f0835b48c99415147495373fca4d27fc030e41c5c19
+size 1396526621

tokenizer/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1 @@


+{"unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]"}

tokenizer/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1 @@


+{"do_lower_case": false, "max_len": 512, "special_tokens_map_file": null, "full_tokenizer_file": null}

tokenizer/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

transformer.json ADDED Viewed

	@@ -0,0 +1,21 @@

+{
+  "architectures": [
+    "BertModel"
+  ],
+  "attention_probs_dropout_prob": 0.2,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.2,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "output_hidden_states": true,
+  "pad_token_id": 0,
+  "type_vocab_size": 2,
+  "vocab_size": 32000
+}