diff --git a/adalora_mlp/0.10.0/README.md b/adalora_mlp/0.10.0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..68d37120621015861eb05e1bf0776c01fe47e59f --- /dev/null +++ b/adalora_mlp/0.10.0/README.md @@ -0,0 +1,203 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/adalora_mlp/0.10.0/adapter_config.json b/adalora_mlp/0.10.0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9afba9fc51dc621a16bf3d02a434d3c127f86603 --- /dev/null +++ b/adalora_mlp/0.10.0/adapter_config.json @@ -0,0 +1,40 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "MLP", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "beta1": 0.85, + "beta2": 0.85, + "bias": "none", + "deltaT": 1, + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "init_r": 12, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.0, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "orth_reg_weight": 0.5, + "peft_type": "ADALORA", + "r": 8, + "rank_pattern": null, + "revision": null, + "target_modules": [ + "lin0" + ], + "target_r": 8, + "task_type": null, + "tfinal": 0, + "tinit": 0, + "total_step": null, + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/adalora_mlp/0.10.0/adapter_model.safetensors b/adalora_mlp/0.10.0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c32799fd7a49d57048e8c39080e9fd3851cf3463 --- /dev/null +++ b/adalora_mlp/0.10.0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5ea5ddc55a1efa998e7958cf23861145f047f09d6026f059de59b5102a2324b +size 1792 diff --git a/adalora_mlp/0.10.0/output.pt b/adalora_mlp/0.10.0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b0613a204186da9da8a73a481a6d8345a2dae90 --- /dev/null +++ b/adalora_mlp/0.10.0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf463d2e25f0620c63f2edba36fccbe7cd034399e3aea88daecbf1861c6c12c5 +size 1239 diff --git a/adalora_opt-350m/0.10.0/README.md b/adalora_opt-350m/0.10.0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..1e3e9240232c38665c4d82d282470bdb8df18e4f --- /dev/null +++ b/adalora_opt-350m/0.10.0/README.md @@ -0,0 +1,204 @@ +--- +library_name: peft +base_model: facebook/opt-350m +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/adalora_opt-350m/0.10.0/adapter_config.json b/adalora_opt-350m/0.10.0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..715cce0f14a83b685046e499c663f89812424ddb --- /dev/null +++ b/adalora_opt-350m/0.10.0/adapter_config.json @@ -0,0 +1,45 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "OPTForCausalLM", + "parent_library": "transformers.models.opt.modeling_opt" + }, + "base_model_name_or_path": "facebook/opt-350m", + "beta1": 0.85, + "beta2": 0.85, + "bias": "none", + "deltaT": 1, + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "init_r": 12, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.0, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "orth_reg_weight": 0.5, + "peft_type": "ADALORA", + "r": 8, + "rank_pattern": null, + "revision": null, + "target_modules": [ + "q_proj", + "k_proj", + "v_proj", + "out_proj", + "fc1", + "fc2" + ], + "target_r": 8, + "task_type": null, + "tfinal": 0, + "tinit": 0, + "total_step": null, + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/adalora_opt-350m/0.10.0/adapter_model.safetensors b/adalora_opt-350m/0.10.0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2ca991a9c5ce9b5cb7c1261fc337c77da8574bd4 --- /dev/null +++ b/adalora_opt-350m/0.10.0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bb9b9604cb5fcf9119038b0104cafc4feda3310dd1eb1b22c6255d1480c5944 +size 21296584 diff --git a/adalora_opt-350m/0.10.0/output.pt b/adalora_opt-350m/0.10.0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..145a1f1f36e5b74a887ec1c710c96073c0218c3e --- /dev/null +++ b/adalora_opt-350m/0.10.0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fca8949df4312d0a0ec5d927dc9758affc6d1920af551ae25763c64a25f69633 +size 1207639 diff --git a/ia3_conv2d/0.10.0/README.md b/ia3_conv2d/0.10.0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..68d37120621015861eb05e1bf0776c01fe47e59f --- /dev/null +++ b/ia3_conv2d/0.10.0/README.md @@ -0,0 +1,203 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/ia3_conv2d/0.10.0/adapter_config.json b/ia3_conv2d/0.10.0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..19ddf8909cf353a4926a1277a9e2b4b0ac49e5e6 --- /dev/null +++ b/ia3_conv2d/0.10.0/adapter_config.json @@ -0,0 +1,20 @@ +{ + "auto_mapping": { + "base_model_class": "ModelConv2D", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "fan_in_fan_out": false, + "feedforward_modules": [ + "conv2d" + ], + "inference_mode": true, + "init_ia3_weights": false, + "modules_to_save": null, + "peft_type": "IA3", + "revision": null, + "target_modules": [ + "conv2d" + ], + "task_type": null +} \ No newline at end of file diff --git a/ia3_conv2d/0.10.0/adapter_model.safetensors b/ia3_conv2d/0.10.0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fed0e83acacc555823c1c06e3025101a4ff23d9d --- /dev/null +++ b/ia3_conv2d/0.10.0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9345734e10567e6dbf5753e6c17a9136a5660f392cdec3edb620c4e1f04319d +size 148 diff --git a/ia3_conv2d/0.10.0/output.pt b/ia3_conv2d/0.10.0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..97abf21279b4d0c4091333adf1a028f6d25c58e7 --- /dev/null +++ b/ia3_conv2d/0.10.0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52919bd5ed67b71087614eb4e10245abaff4d23f281fd1bb883c1e8ca619f59c +size 1175 diff --git a/ia3_mlp/0.10.0/README.md b/ia3_mlp/0.10.0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..68d37120621015861eb05e1bf0776c01fe47e59f --- /dev/null +++ b/ia3_mlp/0.10.0/README.md @@ -0,0 +1,203 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/ia3_mlp/0.10.0/adapter_config.json b/ia3_mlp/0.10.0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e9707db75ebb2b2761f1cd3f7d61a70754f8694c --- /dev/null +++ b/ia3_mlp/0.10.0/adapter_config.json @@ -0,0 +1,20 @@ +{ + "auto_mapping": { + "base_model_class": "MLP", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "fan_in_fan_out": false, + "feedforward_modules": [ + "lin0" + ], + "inference_mode": true, + "init_ia3_weights": false, + "modules_to_save": null, + "peft_type": "IA3", + "revision": null, + "target_modules": [ + "lin0" + ], + "task_type": null +} \ No newline at end of file diff --git a/ia3_mlp/0.10.0/adapter_model.safetensors b/ia3_mlp/0.10.0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7536d7a0731a31c0e4279ef3d813f35ee14cc7ee --- /dev/null +++ b/ia3_mlp/0.10.0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ad391096a69dfb2259a7d15ec8876811caf751a2f0bbf914dc1d4a5b7fce81a +size 168 diff --git a/ia3_mlp/0.10.0/output.pt b/ia3_mlp/0.10.0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..a264d2c19f10227e459378aef5e611ca34ee6a01 --- /dev/null +++ b/ia3_mlp/0.10.0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c48c26cb5a4b979ca2680ef20339e99cd152289f43f9081804754b28f0b8cdd3 +size 1239 diff --git a/ia3_no_ff_mlp/0.10.0/README.md b/ia3_no_ff_mlp/0.10.0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..68d37120621015861eb05e1bf0776c01fe47e59f --- /dev/null +++ b/ia3_no_ff_mlp/0.10.0/README.md @@ -0,0 +1,203 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/ia3_no_ff_mlp/0.10.0/adapter_config.json b/ia3_no_ff_mlp/0.10.0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..32107143e57f3d6ca4a29d88ff21fc09323482d6 --- /dev/null +++ b/ia3_no_ff_mlp/0.10.0/adapter_config.json @@ -0,0 +1,18 @@ +{ + "auto_mapping": { + "base_model_class": "MLP", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "fan_in_fan_out": false, + "feedforward_modules": [], + "inference_mode": true, + "init_ia3_weights": false, + "modules_to_save": null, + "peft_type": "IA3", + "revision": null, + "target_modules": [ + "lin0" + ], + "task_type": null +} \ No newline at end of file diff --git a/ia3_no_ff_mlp/0.10.0/adapter_model.safetensors b/ia3_no_ff_mlp/0.10.0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..81f8c68952527805043c8cdc2a86b0f784bf6348 --- /dev/null +++ b/ia3_no_ff_mlp/0.10.0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5743c903d79e84431258c60a4b7ad84f576b76b6783ad0fed84a5916d5ca0c6 +size 208 diff --git a/ia3_no_ff_mlp/0.10.0/output.pt b/ia3_no_ff_mlp/0.10.0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7d1572f3d768a21b26c31fcf3301db7f1cbecc8 --- /dev/null +++ b/ia3_no_ff_mlp/0.10.0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f9a740f21bef2743dab177047bba223af7cadbf62841d6a168192c6e6c6fa01 +size 1239 diff --git a/ia3_opt-350m/0.10.0/README.md b/ia3_opt-350m/0.10.0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..1e3e9240232c38665c4d82d282470bdb8df18e4f --- /dev/null +++ b/ia3_opt-350m/0.10.0/README.md @@ -0,0 +1,204 @@ +--- +library_name: peft +base_model: facebook/opt-350m +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/ia3_opt-350m/0.10.0/adapter_config.json b/ia3_opt-350m/0.10.0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..aeb532c1953f75af535e6862d4d38872162b8169 --- /dev/null +++ b/ia3_opt-350m/0.10.0/adapter_config.json @@ -0,0 +1,22 @@ +{ + "auto_mapping": { + "base_model_class": "OPTForCausalLM", + "parent_library": "transformers.models.opt.modeling_opt" + }, + "base_model_name_or_path": "facebook/opt-350m", + "fan_in_fan_out": false, + "feedforward_modules": [ + "fc2" + ], + "inference_mode": true, + "init_ia3_weights": false, + "modules_to_save": null, + "peft_type": "IA3", + "revision": null, + "target_modules": [ + "q_proj", + "k_proj", + "fc2" + ], + "task_type": null +} \ No newline at end of file diff --git a/ia3_opt-350m/0.10.0/adapter_model.safetensors b/ia3_opt-350m/0.10.0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5c36b729476b2981d2bf493f95ed8d996ecfe69f --- /dev/null +++ b/ia3_opt-350m/0.10.0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a81de1816feef77f280dd0098df77723c7d289fc1f3f9d787becb6fa41afc22 +size 598856 diff --git a/ia3_opt-350m/0.10.0/output.pt b/ia3_opt-350m/0.10.0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca35df52df5ec22c7f5e1ab37fc48f696c9bb9d2 --- /dev/null +++ b/ia3_opt-350m/0.10.0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74ff512a2c5983b95dbe3e7bf19690f28cd45ce23283713d9dfb54ca47bd5f08 +size 1207639 diff --git a/lora_conv2d/0.10.0/README.md b/lora_conv2d/0.10.0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..68d37120621015861eb05e1bf0776c01fe47e59f --- /dev/null +++ b/lora_conv2d/0.10.0/README.md @@ -0,0 +1,203 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/lora_conv2d/0.10.0/adapter_config.json b/lora_conv2d/0.10.0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..dc6f9c7f60998c86aba9ccbd915ea98ff2a188dc --- /dev/null +++ b/lora_conv2d/0.10.0/adapter_config.json @@ -0,0 +1,31 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "ModelConv2D", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.0, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "conv2d" + ], + "task_type": null, + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/lora_conv2d/0.10.0/adapter_model.safetensors b/lora_conv2d/0.10.0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6a94fb1d101a4c9afe37241108d1ad22b2a81b06 --- /dev/null +++ b/lora_conv2d/0.10.0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd9b1435a896564dff9bd097ac96ad1b330ab458a4d42fefb95f23a5e88d310e +size 2000 diff --git a/lora_conv2d/0.10.0/output.pt b/lora_conv2d/0.10.0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..adab21ee27e33931ca29417aed690c562d856f18 --- /dev/null +++ b/lora_conv2d/0.10.0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1133f060fa4c33a00d693a12f1ce5da805a7a83b8d103b91d0b243b9cd0f2a22 +size 1175 diff --git a/lora_emb_conv1d/0.10.0/README.md b/lora_emb_conv1d/0.10.0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..68d37120621015861eb05e1bf0776c01fe47e59f --- /dev/null +++ b/lora_emb_conv1d/0.10.0/README.md @@ -0,0 +1,203 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/lora_emb_conv1d/0.10.0/adapter_config.json b/lora_emb_conv1d/0.10.0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..af9f5a13b0bacdf3e4d1437279ed9716f7cd9374 --- /dev/null +++ b/lora_emb_conv1d/0.10.0/adapter_config.json @@ -0,0 +1,32 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "ModelEmbConv1D", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "bias": "none", + "fan_in_fan_out": true, + "inference_mode": true, + "init_lora_weights": false, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.0, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "emb", + "conv1d" + ], + "task_type": null, + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/lora_emb_conv1d/0.10.0/adapter_model.safetensors b/lora_emb_conv1d/0.10.0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4028422f51f0c110c684348db7e19c17a31fb0df --- /dev/null +++ b/lora_emb_conv1d/0.10.0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d1b535c7c7b3338f55c6c5b085b61d353d2a413f258bf6c4c05d5c8e6e00534 +size 3976 diff --git a/lora_emb_conv1d/0.10.0/output.pt b/lora_emb_conv1d/0.10.0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..347432c7352e0192fd673d3bfef17bf4e216cbb4 --- /dev/null +++ b/lora_emb_conv1d/0.10.0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7587645064a53bf568a92ecbc0e5f6f90fe84aa46c35402287b5d7bae3b4a015 +size 1239 diff --git a/lora_mlp/0.10.0/README.md b/lora_mlp/0.10.0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..68d37120621015861eb05e1bf0776c01fe47e59f --- /dev/null +++ b/lora_mlp/0.10.0/README.md @@ -0,0 +1,203 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/lora_mlp/0.10.0/adapter_config.json b/lora_mlp/0.10.0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..97a77d16107d9251f2d787e3552b0df1c2e0aab7 --- /dev/null +++ b/lora_mlp/0.10.0/adapter_config.json @@ -0,0 +1,31 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "MLP", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.0, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "lin0" + ], + "task_type": null, + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/lora_mlp/0.10.0/adapter_model.safetensors b/lora_mlp/0.10.0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..301daa9b8037d8ee8368917e2cdc0b85c7ef878f --- /dev/null +++ b/lora_mlp/0.10.0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dd16d2ccf171be88c29650a5780635f0418d21e8c74f7e4e919c3498e74d6a0 +size 1192 diff --git a/lora_mlp/0.10.0/output.pt b/lora_mlp/0.10.0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ff4325eb6753f08e69dcc759248e9d8c13319dd --- /dev/null +++ b/lora_mlp/0.10.0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50bcd27616ca78b6a55df1f21901d25ff81b4bcc4b8633e9de5456be9e76ede2 +size 1239 diff --git a/lora_mlp_modules_to_save/0.10.0/README.md b/lora_mlp_modules_to_save/0.10.0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..68d37120621015861eb05e1bf0776c01fe47e59f --- /dev/null +++ b/lora_mlp_modules_to_save/0.10.0/README.md @@ -0,0 +1,203 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/lora_mlp_modules_to_save/0.10.0/adapter_config.json b/lora_mlp_modules_to_save/0.10.0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..4f88a523ed97ecbfcab4c3e60514afd4a81f2267 --- /dev/null +++ b/lora_mlp_modules_to_save/0.10.0/adapter_config.json @@ -0,0 +1,33 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "MLP", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.0, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": [ + "lin1" + ], + "peft_type": "LORA", + "r": 8, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "lin0" + ], + "task_type": null, + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/lora_mlp_modules_to_save/0.10.0/adapter_model.safetensors b/lora_mlp_modules_to_save/0.10.0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..165486bf6166a4e487501b4d70d4ae9f995ac004 --- /dev/null +++ b/lora_mlp_modules_to_save/0.10.0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c1939cb8cb41a8bb5f05238d37aa77d18d96d1d7a9d3afa6d6ff2d2ef9805ea +size 1528 diff --git a/lora_mlp_modules_to_save/0.10.0/output.pt b/lora_mlp_modules_to_save/0.10.0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ff4325eb6753f08e69dcc759248e9d8c13319dd --- /dev/null +++ b/lora_mlp_modules_to_save/0.10.0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50bcd27616ca78b6a55df1f21901d25ff81b4bcc4b8633e9de5456be9e76ede2 +size 1239 diff --git a/lora_opt-350m/0.10.0/README.md b/lora_opt-350m/0.10.0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..1e3e9240232c38665c4d82d282470bdb8df18e4f --- /dev/null +++ b/lora_opt-350m/0.10.0/README.md @@ -0,0 +1,204 @@ +--- +library_name: peft +base_model: facebook/opt-350m +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/lora_opt-350m/0.10.0/adapter_config.json b/lora_opt-350m/0.10.0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..49ff81620f8afbf673a67e86d41cca3464920e05 --- /dev/null +++ b/lora_opt-350m/0.10.0/adapter_config.json @@ -0,0 +1,32 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "OPTForCausalLM", + "parent_library": "transformers.models.opt.modeling_opt" + }, + "base_model_name_or_path": "facebook/opt-350m", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.0, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "v_proj", + "q_proj" + ], + "task_type": null, + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/lora_opt-350m/0.10.0/adapter_model.safetensors b/lora_opt-350m/0.10.0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f87f3c2cced2e4736aa0481a818067ffa1b64558 --- /dev/null +++ b/lora_opt-350m/0.10.0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ece009e7ac28447a45cef4a37c5a4a0048b5a5b12261e37464fa762771b94a86 +size 3159096 diff --git a/lora_opt-350m/0.10.0/output.pt b/lora_opt-350m/0.10.0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f713a24401b24ae82952fecd454c5976d1e336f --- /dev/null +++ b/lora_opt-350m/0.10.0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:429c9016c3f9c6a01edfe736061be7d9d85f9cb1c3088de58e9121b8c1bce0d8 +size 1207639 diff --git a/lora_opt-350m_bnb_4bit/0.10.0/README.md b/lora_opt-350m_bnb_4bit/0.10.0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..1e3e9240232c38665c4d82d282470bdb8df18e4f --- /dev/null +++ b/lora_opt-350m_bnb_4bit/0.10.0/README.md @@ -0,0 +1,204 @@ +--- +library_name: peft +base_model: facebook/opt-350m +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/lora_opt-350m_bnb_4bit/0.10.0/adapter_config.json b/lora_opt-350m_bnb_4bit/0.10.0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..49ff81620f8afbf673a67e86d41cca3464920e05 --- /dev/null +++ b/lora_opt-350m_bnb_4bit/0.10.0/adapter_config.json @@ -0,0 +1,32 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "OPTForCausalLM", + "parent_library": "transformers.models.opt.modeling_opt" + }, + "base_model_name_or_path": "facebook/opt-350m", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.0, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "v_proj", + "q_proj" + ], + "task_type": null, + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/lora_opt-350m_bnb_4bit/0.10.0/adapter_model.safetensors b/lora_opt-350m_bnb_4bit/0.10.0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f87f3c2cced2e4736aa0481a818067ffa1b64558 --- /dev/null +++ b/lora_opt-350m_bnb_4bit/0.10.0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ece009e7ac28447a45cef4a37c5a4a0048b5a5b12261e37464fa762771b94a86 +size 3159096 diff --git a/lora_opt-350m_bnb_4bit/0.10.0/output.pt b/lora_opt-350m_bnb_4bit/0.10.0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..b118e5d6781a00eafc25233b573e4cedffb81eed --- /dev/null +++ b/lora_opt-350m_bnb_4bit/0.10.0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b464cd9d9104b1a9baab040edc8380fa44239ccd9924116e22e581c262860bba +size 1207639 diff --git a/lora_opt-350m_bnb_8bit/0.10.0/README.md b/lora_opt-350m_bnb_8bit/0.10.0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..1e3e9240232c38665c4d82d282470bdb8df18e4f --- /dev/null +++ b/lora_opt-350m_bnb_8bit/0.10.0/README.md @@ -0,0 +1,204 @@ +--- +library_name: peft +base_model: facebook/opt-350m +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/lora_opt-350m_bnb_8bit/0.10.0/adapter_config.json b/lora_opt-350m_bnb_8bit/0.10.0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..49ff81620f8afbf673a67e86d41cca3464920e05 --- /dev/null +++ b/lora_opt-350m_bnb_8bit/0.10.0/adapter_config.json @@ -0,0 +1,32 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "OPTForCausalLM", + "parent_library": "transformers.models.opt.modeling_opt" + }, + "base_model_name_or_path": "facebook/opt-350m", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.0, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "v_proj", + "q_proj" + ], + "task_type": null, + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/lora_opt-350m_bnb_8bit/0.10.0/adapter_model.safetensors b/lora_opt-350m_bnb_8bit/0.10.0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f87f3c2cced2e4736aa0481a818067ffa1b64558 --- /dev/null +++ b/lora_opt-350m_bnb_8bit/0.10.0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ece009e7ac28447a45cef4a37c5a4a0048b5a5b12261e37464fa762771b94a86 +size 3159096 diff --git a/lora_opt-350m_bnb_8bit/0.10.0/output.pt b/lora_opt-350m_bnb_8bit/0.10.0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..36676c3eefb35372764e496e4df865dc1b3a1e97 --- /dev/null +++ b/lora_opt-350m_bnb_8bit/0.10.0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1293fc3f775524733cbbc0febbba2e309af29451c8381c65b1057dbfb64a6dd3 +size 604375