diff --git a/adalora_mlp/0.6.2/README.md b/adalora_mlp/0.6.2/README.md new file mode 100644 index 0000000000000000000000000000000000000000..63ae1cbe8a669956cb256c817e716e9445e29c0d --- /dev/null +++ b/adalora_mlp/0.6.2/README.md @@ -0,0 +1,206 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +## Training procedure + + +### Framework versions + + +- PEFT 0.6.2 diff --git a/adalora_mlp/0.6.2/adapter_config.json b/adalora_mlp/0.6.2/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..b61742a1b83bd11c60da5383a3725fa1cb71eee6 --- /dev/null +++ b/adalora_mlp/0.6.2/adapter_config.json @@ -0,0 +1,34 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "MLP", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "beta1": 0.85, + "beta2": 0.85, + "bias": "none", + "deltaT": 1, + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "init_r": 12, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 8, + "lora_dropout": 0.0, + "modules_to_save": null, + "orth_reg_weight": 0.5, + "peft_type": "ADALORA", + "r": 8, + "rank_pattern": null, + "revision": null, + "target_modules": [ + "lin0" + ], + "target_r": 8, + "task_type": null, + "tfinal": 0, + "tinit": 0, + "total_step": null +} \ No newline at end of file diff --git a/adalora_mlp/0.6.2/adapter_model.safetensors b/adalora_mlp/0.6.2/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6116f819a347dc2bf1d208ebd84c6bb3f75e2ecb --- /dev/null +++ b/adalora_mlp/0.6.2/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9479f2503c55f4c63e0a5682c3855910de00377f39aee2ea9687412f45bb8d4 +size 1792 diff --git a/adalora_mlp/0.6.2/output.pt b/adalora_mlp/0.6.2/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd2dada906ff27a78cf0ea71ee6b2efa4db68d8d --- /dev/null +++ b/adalora_mlp/0.6.2/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c90d9caa327c2bc1237d69be84caaa5ea3b9110f3b0ef3036e3349bf528c97ee +size 1239 diff --git a/adalora_opt-350m/0.6.2/README.md b/adalora_opt-350m/0.6.2/README.md new file mode 100644 index 0000000000000000000000000000000000000000..1054ee4f0179053670a33097a2896e86bf117c6d --- /dev/null +++ b/adalora_opt-350m/0.6.2/README.md @@ -0,0 +1,207 @@ +--- +library_name: peft +base_model: facebook/opt-350m +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +## Training procedure + + +### Framework versions + + +- PEFT 0.6.2 diff --git a/adalora_opt-350m/0.6.2/adapter_config.json b/adalora_opt-350m/0.6.2/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1d5e38510b01919fedd93f5c2c5ca891cd8155b6 --- /dev/null +++ b/adalora_opt-350m/0.6.2/adapter_config.json @@ -0,0 +1,39 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "OPTForCausalLM", + "parent_library": "transformers.models.opt.modeling_opt" + }, + "base_model_name_or_path": "facebook/opt-350m", + "beta1": 0.85, + "beta2": 0.85, + "bias": "none", + "deltaT": 1, + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "init_r": 12, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 8, + "lora_dropout": 0.0, + "modules_to_save": null, + "orth_reg_weight": 0.5, + "peft_type": "ADALORA", + "r": 8, + "rank_pattern": null, + "revision": null, + "target_modules": [ + "q_proj", + "k_proj", + "v_proj", + "out_proj", + "fc1", + "fc2" + ], + "target_r": 8, + "task_type": null, + "tfinal": 0, + "tinit": 0, + "total_step": null +} \ No newline at end of file diff --git a/adalora_opt-350m/0.6.2/adapter_model.safetensors b/adalora_opt-350m/0.6.2/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d6c1846e56247b219f33da8680f6a2f45df0ce35 --- /dev/null +++ b/adalora_opt-350m/0.6.2/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b95942c9e2029d128034ec7ab28b882a763ccd18aa6dc0eb5c47dc66a89479ba +size 21296584 diff --git a/adalora_opt-350m/0.6.2/output.pt b/adalora_opt-350m/0.6.2/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..c314b6353fe4971ade3afec471ae7147d3e2db07 --- /dev/null +++ b/adalora_opt-350m/0.6.2/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45cd059248e254577130528f6b9b6ab434bda781523f9e33e6ba47c67b429ff8 +size 1207639 diff --git a/ia3_conv2d/0.6.2/README.md b/ia3_conv2d/0.6.2/README.md new file mode 100644 index 0000000000000000000000000000000000000000..63ae1cbe8a669956cb256c817e716e9445e29c0d --- /dev/null +++ b/ia3_conv2d/0.6.2/README.md @@ -0,0 +1,206 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +## Training procedure + + +### Framework versions + + +- PEFT 0.6.2 diff --git a/ia3_conv2d/0.6.2/adapter_config.json b/ia3_conv2d/0.6.2/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..19ddf8909cf353a4926a1277a9e2b4b0ac49e5e6 --- /dev/null +++ b/ia3_conv2d/0.6.2/adapter_config.json @@ -0,0 +1,20 @@ +{ + "auto_mapping": { + "base_model_class": "ModelConv2D", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "fan_in_fan_out": false, + "feedforward_modules": [ + "conv2d" + ], + "inference_mode": true, + "init_ia3_weights": false, + "modules_to_save": null, + "peft_type": "IA3", + "revision": null, + "target_modules": [ + "conv2d" + ], + "task_type": null +} \ No newline at end of file diff --git a/ia3_conv2d/0.6.2/adapter_model.safetensors b/ia3_conv2d/0.6.2/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ee8215388f28d471efd9340cb669b5aebe50a50b --- /dev/null +++ b/ia3_conv2d/0.6.2/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b3d25f99cd10353987666d320c8ae6f7a2e61129836888af543059a6d2233ed +size 148 diff --git a/ia3_conv2d/0.6.2/output.pt b/ia3_conv2d/0.6.2/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..84537ab214f0acf7cf3cd7aa206aa85b0dd1c696 --- /dev/null +++ b/ia3_conv2d/0.6.2/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6aeaa649528f43b5360de6d40aa805ac7bb1a9a98799172df77d04c21324a308 +size 1175 diff --git a/ia3_mlp/0.6.2/README.md b/ia3_mlp/0.6.2/README.md new file mode 100644 index 0000000000000000000000000000000000000000..63ae1cbe8a669956cb256c817e716e9445e29c0d --- /dev/null +++ b/ia3_mlp/0.6.2/README.md @@ -0,0 +1,206 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +## Training procedure + + +### Framework versions + + +- PEFT 0.6.2 diff --git a/ia3_mlp/0.6.2/adapter_config.json b/ia3_mlp/0.6.2/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e9707db75ebb2b2761f1cd3f7d61a70754f8694c --- /dev/null +++ b/ia3_mlp/0.6.2/adapter_config.json @@ -0,0 +1,20 @@ +{ + "auto_mapping": { + "base_model_class": "MLP", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "fan_in_fan_out": false, + "feedforward_modules": [ + "lin0" + ], + "inference_mode": true, + "init_ia3_weights": false, + "modules_to_save": null, + "peft_type": "IA3", + "revision": null, + "target_modules": [ + "lin0" + ], + "task_type": null +} \ No newline at end of file diff --git a/ia3_mlp/0.6.2/adapter_model.safetensors b/ia3_mlp/0.6.2/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..800ca50b5360c8d08298a7668be7b2302e3e3654 --- /dev/null +++ b/ia3_mlp/0.6.2/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f37cf4c827d5730fde053cc5e43926b7a329255bdf39a77b24d504d19ccda746 +size 168 diff --git a/ia3_mlp/0.6.2/output.pt b/ia3_mlp/0.6.2/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..f01d88bc75a2cbce983b1a104a9c0621b80e6b5d --- /dev/null +++ b/ia3_mlp/0.6.2/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d37ff05838c1628679f56a34b0e5c8e13f5cd9814216faa88d43a696dce9764 +size 1239 diff --git a/ia3_no_ff_mlp/0.6.2/README.md b/ia3_no_ff_mlp/0.6.2/README.md new file mode 100644 index 0000000000000000000000000000000000000000..63ae1cbe8a669956cb256c817e716e9445e29c0d --- /dev/null +++ b/ia3_no_ff_mlp/0.6.2/README.md @@ -0,0 +1,206 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +## Training procedure + + +### Framework versions + + +- PEFT 0.6.2 diff --git a/ia3_no_ff_mlp/0.6.2/adapter_config.json b/ia3_no_ff_mlp/0.6.2/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..32107143e57f3d6ca4a29d88ff21fc09323482d6 --- /dev/null +++ b/ia3_no_ff_mlp/0.6.2/adapter_config.json @@ -0,0 +1,18 @@ +{ + "auto_mapping": { + "base_model_class": "MLP", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "fan_in_fan_out": false, + "feedforward_modules": [], + "inference_mode": true, + "init_ia3_weights": false, + "modules_to_save": null, + "peft_type": "IA3", + "revision": null, + "target_modules": [ + "lin0" + ], + "task_type": null +} \ No newline at end of file diff --git a/ia3_no_ff_mlp/0.6.2/adapter_model.safetensors b/ia3_no_ff_mlp/0.6.2/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b1d1dc132521e44c08874d1d735878b2bace7942 --- /dev/null +++ b/ia3_no_ff_mlp/0.6.2/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dd84ea77e8fe4df72057bd6b5a02c633dae2afa33b6d7286f2859c5dd53a8c0 +size 208 diff --git a/ia3_no_ff_mlp/0.6.2/output.pt b/ia3_no_ff_mlp/0.6.2/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..700369572e0dac5e2ac3d60419088c74916d93ff --- /dev/null +++ b/ia3_no_ff_mlp/0.6.2/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6916d7bee023d39d11075986bb824a1569bffe25f855ddb956e95c56886a1164 +size 1239 diff --git a/ia3_opt-350m/0.6.2/README.md b/ia3_opt-350m/0.6.2/README.md new file mode 100644 index 0000000000000000000000000000000000000000..1054ee4f0179053670a33097a2896e86bf117c6d --- /dev/null +++ b/ia3_opt-350m/0.6.2/README.md @@ -0,0 +1,207 @@ +--- +library_name: peft +base_model: facebook/opt-350m +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +## Training procedure + + +### Framework versions + + +- PEFT 0.6.2 diff --git a/ia3_opt-350m/0.6.2/adapter_config.json b/ia3_opt-350m/0.6.2/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..aeb532c1953f75af535e6862d4d38872162b8169 --- /dev/null +++ b/ia3_opt-350m/0.6.2/adapter_config.json @@ -0,0 +1,22 @@ +{ + "auto_mapping": { + "base_model_class": "OPTForCausalLM", + "parent_library": "transformers.models.opt.modeling_opt" + }, + "base_model_name_or_path": "facebook/opt-350m", + "fan_in_fan_out": false, + "feedforward_modules": [ + "fc2" + ], + "inference_mode": true, + "init_ia3_weights": false, + "modules_to_save": null, + "peft_type": "IA3", + "revision": null, + "target_modules": [ + "q_proj", + "k_proj", + "fc2" + ], + "task_type": null +} \ No newline at end of file diff --git a/ia3_opt-350m/0.6.2/adapter_model.safetensors b/ia3_opt-350m/0.6.2/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d7a760dba37981e0692fbdb843d339e9d7d2f61f --- /dev/null +++ b/ia3_opt-350m/0.6.2/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7c93fe9f415a0f029daf4fd99656c672ad297586f1a82e61b0755a6861297c0 +size 598856 diff --git a/ia3_opt-350m/0.6.2/output.pt b/ia3_opt-350m/0.6.2/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd6d4747aa1fb4d01b170d9d3275f74decd56041 --- /dev/null +++ b/ia3_opt-350m/0.6.2/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:227dde8197b0422d4f0e6633b0b2f678a8f2602959003db4528e15e2b6b393ee +size 1207639 diff --git a/lora_conv2d/0.6.2/README.md b/lora_conv2d/0.6.2/README.md new file mode 100644 index 0000000000000000000000000000000000000000..63ae1cbe8a669956cb256c817e716e9445e29c0d --- /dev/null +++ b/lora_conv2d/0.6.2/README.md @@ -0,0 +1,206 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +## Training procedure + + +### Framework versions + + +- PEFT 0.6.2 diff --git a/lora_conv2d/0.6.2/adapter_config.json b/lora_conv2d/0.6.2/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1348e328b0e08f28ad8321eecec261850b426648 --- /dev/null +++ b/lora_conv2d/0.6.2/adapter_config.json @@ -0,0 +1,25 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "ModelConv2D", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 8, + "lora_dropout": 0.0, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "conv2d" + ], + "task_type": null +} \ No newline at end of file diff --git a/lora_conv2d/0.6.2/adapter_model.safetensors b/lora_conv2d/0.6.2/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6a94fb1d101a4c9afe37241108d1ad22b2a81b06 --- /dev/null +++ b/lora_conv2d/0.6.2/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd9b1435a896564dff9bd097ac96ad1b330ab458a4d42fefb95f23a5e88d310e +size 2000 diff --git a/lora_conv2d/0.6.2/output.pt b/lora_conv2d/0.6.2/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..adab21ee27e33931ca29417aed690c562d856f18 --- /dev/null +++ b/lora_conv2d/0.6.2/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1133f060fa4c33a00d693a12f1ce5da805a7a83b8d103b91d0b243b9cd0f2a22 +size 1175 diff --git a/lora_emb_conv1d/0.6.2/README.md b/lora_emb_conv1d/0.6.2/README.md new file mode 100644 index 0000000000000000000000000000000000000000..63ae1cbe8a669956cb256c817e716e9445e29c0d --- /dev/null +++ b/lora_emb_conv1d/0.6.2/README.md @@ -0,0 +1,206 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +## Training procedure + + +### Framework versions + + +- PEFT 0.6.2 diff --git a/lora_emb_conv1d/0.6.2/adapter_config.json b/lora_emb_conv1d/0.6.2/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..d4e2599816417114dc312d7e477d4317e7c73c63 --- /dev/null +++ b/lora_emb_conv1d/0.6.2/adapter_config.json @@ -0,0 +1,26 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "ModelEmbConv1D", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "bias": "none", + "fan_in_fan_out": true, + "inference_mode": true, + "init_lora_weights": false, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 8, + "lora_dropout": 0.0, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "emb", + "conv1d" + ], + "task_type": null +} \ No newline at end of file diff --git a/lora_emb_conv1d/0.6.2/adapter_model.safetensors b/lora_emb_conv1d/0.6.2/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4028422f51f0c110c684348db7e19c17a31fb0df --- /dev/null +++ b/lora_emb_conv1d/0.6.2/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d1b535c7c7b3338f55c6c5b085b61d353d2a413f258bf6c4c05d5c8e6e00534 +size 3976 diff --git a/lora_emb_conv1d/0.6.2/output.pt b/lora_emb_conv1d/0.6.2/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..347432c7352e0192fd673d3bfef17bf4e216cbb4 --- /dev/null +++ b/lora_emb_conv1d/0.6.2/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7587645064a53bf568a92ecbc0e5f6f90fe84aa46c35402287b5d7bae3b4a015 +size 1239 diff --git a/lora_mlp/0.6.2/README.md b/lora_mlp/0.6.2/README.md new file mode 100644 index 0000000000000000000000000000000000000000..63ae1cbe8a669956cb256c817e716e9445e29c0d --- /dev/null +++ b/lora_mlp/0.6.2/README.md @@ -0,0 +1,206 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +## Training procedure + + +### Framework versions + + +- PEFT 0.6.2 diff --git a/lora_mlp/0.6.2/adapter_config.json b/lora_mlp/0.6.2/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..60138a9f9d2f05efc121ef69012bb489bdf88845 --- /dev/null +++ b/lora_mlp/0.6.2/adapter_config.json @@ -0,0 +1,25 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "MLP", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 8, + "lora_dropout": 0.0, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "lin0" + ], + "task_type": null +} \ No newline at end of file diff --git a/lora_mlp/0.6.2/adapter_model.safetensors b/lora_mlp/0.6.2/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..301daa9b8037d8ee8368917e2cdc0b85c7ef878f --- /dev/null +++ b/lora_mlp/0.6.2/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dd16d2ccf171be88c29650a5780635f0418d21e8c74f7e4e919c3498e74d6a0 +size 1192 diff --git a/lora_mlp/0.6.2/output.pt b/lora_mlp/0.6.2/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ff4325eb6753f08e69dcc759248e9d8c13319dd --- /dev/null +++ b/lora_mlp/0.6.2/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50bcd27616ca78b6a55df1f21901d25ff81b4bcc4b8633e9de5456be9e76ede2 +size 1239 diff --git a/lora_mlp_modules_to_save/0.6.2/README.md b/lora_mlp_modules_to_save/0.6.2/README.md new file mode 100644 index 0000000000000000000000000000000000000000..63ae1cbe8a669956cb256c817e716e9445e29c0d --- /dev/null +++ b/lora_mlp_modules_to_save/0.6.2/README.md @@ -0,0 +1,206 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +## Training procedure + + +### Framework versions + + +- PEFT 0.6.2 diff --git a/lora_mlp_modules_to_save/0.6.2/adapter_config.json b/lora_mlp_modules_to_save/0.6.2/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a405866a81df5521548320801b07971ced2db288 --- /dev/null +++ b/lora_mlp_modules_to_save/0.6.2/adapter_config.json @@ -0,0 +1,27 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "MLP", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 8, + "lora_dropout": 0.0, + "modules_to_save": [ + "lin1" + ], + "peft_type": "LORA", + "r": 8, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "lin0" + ], + "task_type": null +} \ No newline at end of file diff --git a/lora_mlp_modules_to_save/0.6.2/adapter_model.safetensors b/lora_mlp_modules_to_save/0.6.2/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..165486bf6166a4e487501b4d70d4ae9f995ac004 --- /dev/null +++ b/lora_mlp_modules_to_save/0.6.2/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c1939cb8cb41a8bb5f05238d37aa77d18d96d1d7a9d3afa6d6ff2d2ef9805ea +size 1528 diff --git a/lora_mlp_modules_to_save/0.6.2/output.pt b/lora_mlp_modules_to_save/0.6.2/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ff4325eb6753f08e69dcc759248e9d8c13319dd --- /dev/null +++ b/lora_mlp_modules_to_save/0.6.2/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50bcd27616ca78b6a55df1f21901d25ff81b4bcc4b8633e9de5456be9e76ede2 +size 1239 diff --git a/lora_opt-350m/0.6.2/README.md b/lora_opt-350m/0.6.2/README.md new file mode 100644 index 0000000000000000000000000000000000000000..1054ee4f0179053670a33097a2896e86bf117c6d --- /dev/null +++ b/lora_opt-350m/0.6.2/README.md @@ -0,0 +1,207 @@ +--- +library_name: peft +base_model: facebook/opt-350m +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +## Training procedure + + +### Framework versions + + +- PEFT 0.6.2 diff --git a/lora_opt-350m/0.6.2/adapter_config.json b/lora_opt-350m/0.6.2/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..cf246fa1b026967eca3e0ebad0a9ee5277b2f237 --- /dev/null +++ b/lora_opt-350m/0.6.2/adapter_config.json @@ -0,0 +1,26 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "OPTForCausalLM", + "parent_library": "transformers.models.opt.modeling_opt" + }, + "base_model_name_or_path": "facebook/opt-350m", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 8, + "lora_dropout": 0.0, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": null +} \ No newline at end of file diff --git a/lora_opt-350m/0.6.2/adapter_model.safetensors b/lora_opt-350m/0.6.2/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4b5a55180d4444d976e7f9fd239c5d68f63a6173 --- /dev/null +++ b/lora_opt-350m/0.6.2/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82751e30bebc19cbfa01212631d08c7032fc3a75996dadf4da1d29298fdd736f +size 3159096 diff --git a/lora_opt-350m/0.6.2/output.pt b/lora_opt-350m/0.6.2/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..729029b97a9a9198394232b754853b7d2fbf602b --- /dev/null +++ b/lora_opt-350m/0.6.2/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:788d8589a3e462ff482ff8926366f18b4bcf9c1d6af2bb1158eff483668645ef +size 1207639 diff --git a/lora_opt-350m_bnb_4bit/0.6.2/README.md b/lora_opt-350m_bnb_4bit/0.6.2/README.md new file mode 100644 index 0000000000000000000000000000000000000000..2636783afb88ccc22ca00e13edb43da1e31533b1 --- /dev/null +++ b/lora_opt-350m_bnb_4bit/0.6.2/README.md @@ -0,0 +1,219 @@ +--- +library_name: peft +base_model: facebook/opt-350m +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +## Training procedure + + +The following `bitsandbytes` quantization config was used during training: +- quant_method: bitsandbytes +- load_in_8bit: False +- load_in_4bit: True +- llm_int8_threshold: 6.0 +- llm_int8_skip_modules: None +- llm_int8_enable_fp32_cpu_offload: False +- llm_int8_has_fp16_weight: False +- bnb_4bit_quant_type: fp4 +- bnb_4bit_use_double_quant: False +- bnb_4bit_compute_dtype: float32 + +### Framework versions + + +- PEFT 0.6.2 diff --git a/lora_opt-350m_bnb_4bit/0.6.2/adapter_config.json b/lora_opt-350m_bnb_4bit/0.6.2/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..cf246fa1b026967eca3e0ebad0a9ee5277b2f237 --- /dev/null +++ b/lora_opt-350m_bnb_4bit/0.6.2/adapter_config.json @@ -0,0 +1,26 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "OPTForCausalLM", + "parent_library": "transformers.models.opt.modeling_opt" + }, + "base_model_name_or_path": "facebook/opt-350m", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 8, + "lora_dropout": 0.0, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": null +} \ No newline at end of file diff --git a/lora_opt-350m_bnb_4bit/0.6.2/adapter_model.safetensors b/lora_opt-350m_bnb_4bit/0.6.2/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f87f3c2cced2e4736aa0481a818067ffa1b64558 --- /dev/null +++ b/lora_opt-350m_bnb_4bit/0.6.2/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ece009e7ac28447a45cef4a37c5a4a0048b5a5b12261e37464fa762771b94a86 +size 3159096 diff --git a/lora_opt-350m_bnb_4bit/0.6.2/output.pt b/lora_opt-350m_bnb_4bit/0.6.2/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7a1439eddc2a07109be26dbf66b9096c9855690 --- /dev/null +++ b/lora_opt-350m_bnb_4bit/0.6.2/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00942ada33ef2fcbe9621268e1cce8c59aeeb71dd1c79101498d00c1881f07f5 +size 1207639 diff --git a/lora_opt-350m_bnb_8bit/0.6.2/README.md b/lora_opt-350m_bnb_8bit/0.6.2/README.md new file mode 100644 index 0000000000000000000000000000000000000000..42be4973a991c2e68646bb40a67fe0887c596734 --- /dev/null +++ b/lora_opt-350m_bnb_8bit/0.6.2/README.md @@ -0,0 +1,219 @@ +--- +library_name: peft +base_model: facebook/opt-350m +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +## Training procedure + + +The following `bitsandbytes` quantization config was used during training: +- quant_method: bitsandbytes +- load_in_8bit: True +- load_in_4bit: False +- llm_int8_threshold: 6.0 +- llm_int8_skip_modules: None +- llm_int8_enable_fp32_cpu_offload: False +- llm_int8_has_fp16_weight: False +- bnb_4bit_quant_type: fp4 +- bnb_4bit_use_double_quant: False +- bnb_4bit_compute_dtype: float32 + +### Framework versions + + +- PEFT 0.6.2 diff --git a/lora_opt-350m_bnb_8bit/0.6.2/adapter_config.json b/lora_opt-350m_bnb_8bit/0.6.2/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..cf246fa1b026967eca3e0ebad0a9ee5277b2f237 --- /dev/null +++ b/lora_opt-350m_bnb_8bit/0.6.2/adapter_config.json @@ -0,0 +1,26 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "OPTForCausalLM", + "parent_library": "transformers.models.opt.modeling_opt" + }, + "base_model_name_or_path": "facebook/opt-350m", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 8, + "lora_dropout": 0.0, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": null +} \ No newline at end of file diff --git a/lora_opt-350m_bnb_8bit/0.6.2/adapter_model.safetensors b/lora_opt-350m_bnb_8bit/0.6.2/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f87f3c2cced2e4736aa0481a818067ffa1b64558 --- /dev/null +++ b/lora_opt-350m_bnb_8bit/0.6.2/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ece009e7ac28447a45cef4a37c5a4a0048b5a5b12261e37464fa762771b94a86 +size 3159096 diff --git a/lora_opt-350m_bnb_8bit/0.6.2/output.pt b/lora_opt-350m_bnb_8bit/0.6.2/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..36676c3eefb35372764e496e4df865dc1b3a1e97 --- /dev/null +++ b/lora_opt-350m_bnb_8bit/0.6.2/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1293fc3f775524733cbbc0febbba2e309af29451c8381c65b1057dbfb64a6dd3 +size 604375