diff --git a/adalora_mlp/0.7.1.dev0/README.md b/adalora_mlp/0.7.1.dev0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8418790a9804519b45d7617c854594ede5dd4e13 --- /dev/null +++ b/adalora_mlp/0.7.1.dev0/README.md @@ -0,0 +1,203 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.7.1.dev0 \ No newline at end of file diff --git a/adalora_mlp/0.7.1.dev0/adapter_config.json b/adalora_mlp/0.7.1.dev0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..d2532652f0d11eb244c1c21e8dd7b4094b3ac330 --- /dev/null +++ b/adalora_mlp/0.7.1.dev0/adapter_config.json @@ -0,0 +1,37 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "MLP", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "beta1": 0.85, + "beta2": 0.85, + "bias": "none", + "deltaT": 1, + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "init_r": 12, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.0, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "orth_reg_weight": 0.5, + "peft_type": "ADALORA", + "r": 8, + "rank_pattern": null, + "revision": null, + "target_modules": [ + "lin0" + ], + "target_r": 8, + "task_type": null, + "tfinal": 0, + "tinit": 0, + "total_step": null +} \ No newline at end of file diff --git a/adalora_mlp/0.7.1.dev0/adapter_model.safetensors b/adalora_mlp/0.7.1.dev0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c32799fd7a49d57048e8c39080e9fd3851cf3463 --- /dev/null +++ b/adalora_mlp/0.7.1.dev0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5ea5ddc55a1efa998e7958cf23861145f047f09d6026f059de59b5102a2324b +size 1792 diff --git a/adalora_mlp/0.7.1.dev0/output.pt b/adalora_mlp/0.7.1.dev0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b0613a204186da9da8a73a481a6d8345a2dae90 --- /dev/null +++ b/adalora_mlp/0.7.1.dev0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf463d2e25f0620c63f2edba36fccbe7cd034399e3aea88daecbf1861c6c12c5 +size 1239 diff --git a/adalora_opt-350m/0.7.1.dev0/README.md b/adalora_opt-350m/0.7.1.dev0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..3013dbdb5845d0f1c5a91b496b5e83b762946353 --- /dev/null +++ b/adalora_opt-350m/0.7.1.dev0/README.md @@ -0,0 +1,204 @@ +--- +library_name: peft +base_model: facebook/opt-350m +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.7.1.dev0 \ No newline at end of file diff --git a/adalora_opt-350m/0.7.1.dev0/adapter_config.json b/adalora_opt-350m/0.7.1.dev0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e2886847569fac9dc9256b17ae3ac769711bb6cf --- /dev/null +++ b/adalora_opt-350m/0.7.1.dev0/adapter_config.json @@ -0,0 +1,42 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "OPTForCausalLM", + "parent_library": "transformers.models.opt.modeling_opt" + }, + "base_model_name_or_path": "facebook/opt-350m", + "beta1": 0.85, + "beta2": 0.85, + "bias": "none", + "deltaT": 1, + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "init_r": 12, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.0, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "orth_reg_weight": 0.5, + "peft_type": "ADALORA", + "r": 8, + "rank_pattern": null, + "revision": null, + "target_modules": [ + "q_proj", + "k_proj", + "v_proj", + "out_proj", + "fc1", + "fc2" + ], + "target_r": 8, + "task_type": null, + "tfinal": 0, + "tinit": 0, + "total_step": null +} \ No newline at end of file diff --git a/adalora_opt-350m/0.7.1.dev0/adapter_model.safetensors b/adalora_opt-350m/0.7.1.dev0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5021ebeb2f4529655b8d45fbd1cf1f3f68081906 --- /dev/null +++ b/adalora_opt-350m/0.7.1.dev0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5822a27af7248b4b2114160966628e30afcc872f5ebbf35055ab005f573afe95 +size 21296584 diff --git a/adalora_opt-350m/0.7.1.dev0/output.pt b/adalora_opt-350m/0.7.1.dev0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..55476b9db585883c229391a57d1c3ea0df3f711f --- /dev/null +++ b/adalora_opt-350m/0.7.1.dev0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94812c0896c14d17f786639e36e92121b565906296a9f00f870cc22bab2b9964 +size 1207639 diff --git a/ia3_conv2d/0.7.1.dev0/README.md b/ia3_conv2d/0.7.1.dev0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8418790a9804519b45d7617c854594ede5dd4e13 --- /dev/null +++ b/ia3_conv2d/0.7.1.dev0/README.md @@ -0,0 +1,203 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.7.1.dev0 \ No newline at end of file diff --git a/ia3_conv2d/0.7.1.dev0/adapter_config.json b/ia3_conv2d/0.7.1.dev0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..19ddf8909cf353a4926a1277a9e2b4b0ac49e5e6 --- /dev/null +++ b/ia3_conv2d/0.7.1.dev0/adapter_config.json @@ -0,0 +1,20 @@ +{ + "auto_mapping": { + "base_model_class": "ModelConv2D", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "fan_in_fan_out": false, + "feedforward_modules": [ + "conv2d" + ], + "inference_mode": true, + "init_ia3_weights": false, + "modules_to_save": null, + "peft_type": "IA3", + "revision": null, + "target_modules": [ + "conv2d" + ], + "task_type": null +} \ No newline at end of file diff --git a/ia3_conv2d/0.7.1.dev0/adapter_model.safetensors b/ia3_conv2d/0.7.1.dev0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fed0e83acacc555823c1c06e3025101a4ff23d9d --- /dev/null +++ b/ia3_conv2d/0.7.1.dev0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9345734e10567e6dbf5753e6c17a9136a5660f392cdec3edb620c4e1f04319d +size 148 diff --git a/ia3_conv2d/0.7.1.dev0/output.pt b/ia3_conv2d/0.7.1.dev0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..97abf21279b4d0c4091333adf1a028f6d25c58e7 --- /dev/null +++ b/ia3_conv2d/0.7.1.dev0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52919bd5ed67b71087614eb4e10245abaff4d23f281fd1bb883c1e8ca619f59c +size 1175 diff --git a/ia3_mlp/0.7.1.dev0/README.md b/ia3_mlp/0.7.1.dev0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8418790a9804519b45d7617c854594ede5dd4e13 --- /dev/null +++ b/ia3_mlp/0.7.1.dev0/README.md @@ -0,0 +1,203 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.7.1.dev0 \ No newline at end of file diff --git a/ia3_mlp/0.7.1.dev0/adapter_config.json b/ia3_mlp/0.7.1.dev0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e9707db75ebb2b2761f1cd3f7d61a70754f8694c --- /dev/null +++ b/ia3_mlp/0.7.1.dev0/adapter_config.json @@ -0,0 +1,20 @@ +{ + "auto_mapping": { + "base_model_class": "MLP", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "fan_in_fan_out": false, + "feedforward_modules": [ + "lin0" + ], + "inference_mode": true, + "init_ia3_weights": false, + "modules_to_save": null, + "peft_type": "IA3", + "revision": null, + "target_modules": [ + "lin0" + ], + "task_type": null +} \ No newline at end of file diff --git a/ia3_mlp/0.7.1.dev0/adapter_model.safetensors b/ia3_mlp/0.7.1.dev0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7536d7a0731a31c0e4279ef3d813f35ee14cc7ee --- /dev/null +++ b/ia3_mlp/0.7.1.dev0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ad391096a69dfb2259a7d15ec8876811caf751a2f0bbf914dc1d4a5b7fce81a +size 168 diff --git a/ia3_mlp/0.7.1.dev0/output.pt b/ia3_mlp/0.7.1.dev0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..a264d2c19f10227e459378aef5e611ca34ee6a01 --- /dev/null +++ b/ia3_mlp/0.7.1.dev0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c48c26cb5a4b979ca2680ef20339e99cd152289f43f9081804754b28f0b8cdd3 +size 1239 diff --git a/ia3_no_ff_mlp/0.7.1.dev0/README.md b/ia3_no_ff_mlp/0.7.1.dev0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8418790a9804519b45d7617c854594ede5dd4e13 --- /dev/null +++ b/ia3_no_ff_mlp/0.7.1.dev0/README.md @@ -0,0 +1,203 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.7.1.dev0 \ No newline at end of file diff --git a/ia3_no_ff_mlp/0.7.1.dev0/adapter_config.json b/ia3_no_ff_mlp/0.7.1.dev0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..32107143e57f3d6ca4a29d88ff21fc09323482d6 --- /dev/null +++ b/ia3_no_ff_mlp/0.7.1.dev0/adapter_config.json @@ -0,0 +1,18 @@ +{ + "auto_mapping": { + "base_model_class": "MLP", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "fan_in_fan_out": false, + "feedforward_modules": [], + "inference_mode": true, + "init_ia3_weights": false, + "modules_to_save": null, + "peft_type": "IA3", + "revision": null, + "target_modules": [ + "lin0" + ], + "task_type": null +} \ No newline at end of file diff --git a/ia3_no_ff_mlp/0.7.1.dev0/adapter_model.safetensors b/ia3_no_ff_mlp/0.7.1.dev0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..81f8c68952527805043c8cdc2a86b0f784bf6348 --- /dev/null +++ b/ia3_no_ff_mlp/0.7.1.dev0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5743c903d79e84431258c60a4b7ad84f576b76b6783ad0fed84a5916d5ca0c6 +size 208 diff --git a/ia3_no_ff_mlp/0.7.1.dev0/output.pt b/ia3_no_ff_mlp/0.7.1.dev0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7d1572f3d768a21b26c31fcf3301db7f1cbecc8 --- /dev/null +++ b/ia3_no_ff_mlp/0.7.1.dev0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f9a740f21bef2743dab177047bba223af7cadbf62841d6a168192c6e6c6fa01 +size 1239 diff --git a/ia3_opt-350m/0.7.1.dev0/README.md b/ia3_opt-350m/0.7.1.dev0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..3013dbdb5845d0f1c5a91b496b5e83b762946353 --- /dev/null +++ b/ia3_opt-350m/0.7.1.dev0/README.md @@ -0,0 +1,204 @@ +--- +library_name: peft +base_model: facebook/opt-350m +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.7.1.dev0 \ No newline at end of file diff --git a/ia3_opt-350m/0.7.1.dev0/adapter_config.json b/ia3_opt-350m/0.7.1.dev0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..aeb532c1953f75af535e6862d4d38872162b8169 --- /dev/null +++ b/ia3_opt-350m/0.7.1.dev0/adapter_config.json @@ -0,0 +1,22 @@ +{ + "auto_mapping": { + "base_model_class": "OPTForCausalLM", + "parent_library": "transformers.models.opt.modeling_opt" + }, + "base_model_name_or_path": "facebook/opt-350m", + "fan_in_fan_out": false, + "feedforward_modules": [ + "fc2" + ], + "inference_mode": true, + "init_ia3_weights": false, + "modules_to_save": null, + "peft_type": "IA3", + "revision": null, + "target_modules": [ + "q_proj", + "k_proj", + "fc2" + ], + "task_type": null +} \ No newline at end of file diff --git a/ia3_opt-350m/0.7.1.dev0/adapter_model.safetensors b/ia3_opt-350m/0.7.1.dev0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..167163af34f7658167454a899c99c80b50170dc5 --- /dev/null +++ b/ia3_opt-350m/0.7.1.dev0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c36d366cf7671c3513721c3e8b376c8b5f01d9a49d38273f66dc6c5fdd49c5b0 +size 598856 diff --git a/ia3_opt-350m/0.7.1.dev0/output.pt b/ia3_opt-350m/0.7.1.dev0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..a625fd76d6c5c35e01a9bd3389982c2ae65eea5c --- /dev/null +++ b/ia3_opt-350m/0.7.1.dev0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4118100e47db290f1d99c4433ea80ee466fb9353f11b8f51bc5dce5f3a611df +size 1207639 diff --git a/lora_conv2d/0.7.1.dev0/README.md b/lora_conv2d/0.7.1.dev0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8418790a9804519b45d7617c854594ede5dd4e13 --- /dev/null +++ b/lora_conv2d/0.7.1.dev0/README.md @@ -0,0 +1,203 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.7.1.dev0 \ No newline at end of file diff --git a/lora_conv2d/0.7.1.dev0/adapter_config.json b/lora_conv2d/0.7.1.dev0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..ebbc01f558887f0d788649d4a2cfcd004e6f6a74 --- /dev/null +++ b/lora_conv2d/0.7.1.dev0/adapter_config.json @@ -0,0 +1,28 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "ModelConv2D", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.0, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "conv2d" + ], + "task_type": null +} \ No newline at end of file diff --git a/lora_conv2d/0.7.1.dev0/adapter_model.safetensors b/lora_conv2d/0.7.1.dev0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6a94fb1d101a4c9afe37241108d1ad22b2a81b06 --- /dev/null +++ b/lora_conv2d/0.7.1.dev0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd9b1435a896564dff9bd097ac96ad1b330ab458a4d42fefb95f23a5e88d310e +size 2000 diff --git a/lora_conv2d/0.7.1.dev0/output.pt b/lora_conv2d/0.7.1.dev0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..adab21ee27e33931ca29417aed690c562d856f18 --- /dev/null +++ b/lora_conv2d/0.7.1.dev0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1133f060fa4c33a00d693a12f1ce5da805a7a83b8d103b91d0b243b9cd0f2a22 +size 1175 diff --git a/lora_emb_conv1d/0.7.1.dev0/README.md b/lora_emb_conv1d/0.7.1.dev0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8418790a9804519b45d7617c854594ede5dd4e13 --- /dev/null +++ b/lora_emb_conv1d/0.7.1.dev0/README.md @@ -0,0 +1,203 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.7.1.dev0 \ No newline at end of file diff --git a/lora_emb_conv1d/0.7.1.dev0/adapter_config.json b/lora_emb_conv1d/0.7.1.dev0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a8556a36902e893829ec889f74961dc414ce345c --- /dev/null +++ b/lora_emb_conv1d/0.7.1.dev0/adapter_config.json @@ -0,0 +1,29 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "ModelEmbConv1D", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "bias": "none", + "fan_in_fan_out": true, + "inference_mode": true, + "init_lora_weights": false, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.0, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "emb", + "conv1d" + ], + "task_type": null +} \ No newline at end of file diff --git a/lora_emb_conv1d/0.7.1.dev0/adapter_model.safetensors b/lora_emb_conv1d/0.7.1.dev0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4028422f51f0c110c684348db7e19c17a31fb0df --- /dev/null +++ b/lora_emb_conv1d/0.7.1.dev0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d1b535c7c7b3338f55c6c5b085b61d353d2a413f258bf6c4c05d5c8e6e00534 +size 3976 diff --git a/lora_emb_conv1d/0.7.1.dev0/output.pt b/lora_emb_conv1d/0.7.1.dev0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..347432c7352e0192fd673d3bfef17bf4e216cbb4 --- /dev/null +++ b/lora_emb_conv1d/0.7.1.dev0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7587645064a53bf568a92ecbc0e5f6f90fe84aa46c35402287b5d7bae3b4a015 +size 1239 diff --git a/lora_mlp/0.7.1.dev0/README.md b/lora_mlp/0.7.1.dev0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8418790a9804519b45d7617c854594ede5dd4e13 --- /dev/null +++ b/lora_mlp/0.7.1.dev0/README.md @@ -0,0 +1,203 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.7.1.dev0 \ No newline at end of file diff --git a/lora_mlp/0.7.1.dev0/adapter_config.json b/lora_mlp/0.7.1.dev0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..e2dbbfc69297aca18fe568eada8409a0d9efcaba --- /dev/null +++ b/lora_mlp/0.7.1.dev0/adapter_config.json @@ -0,0 +1,28 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "MLP", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.0, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "lin0" + ], + "task_type": null +} \ No newline at end of file diff --git a/lora_mlp/0.7.1.dev0/adapter_model.safetensors b/lora_mlp/0.7.1.dev0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..301daa9b8037d8ee8368917e2cdc0b85c7ef878f --- /dev/null +++ b/lora_mlp/0.7.1.dev0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dd16d2ccf171be88c29650a5780635f0418d21e8c74f7e4e919c3498e74d6a0 +size 1192 diff --git a/lora_mlp/0.7.1.dev0/output.pt b/lora_mlp/0.7.1.dev0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ff4325eb6753f08e69dcc759248e9d8c13319dd --- /dev/null +++ b/lora_mlp/0.7.1.dev0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50bcd27616ca78b6a55df1f21901d25ff81b4bcc4b8633e9de5456be9e76ede2 +size 1239 diff --git a/lora_mlp_modules_to_save/0.7.1.dev0/README.md b/lora_mlp_modules_to_save/0.7.1.dev0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8418790a9804519b45d7617c854594ede5dd4e13 --- /dev/null +++ b/lora_mlp_modules_to_save/0.7.1.dev0/README.md @@ -0,0 +1,203 @@ +--- +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.7.1.dev0 \ No newline at end of file diff --git a/lora_mlp_modules_to_save/0.7.1.dev0/adapter_config.json b/lora_mlp_modules_to_save/0.7.1.dev0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a57a7864c41b37046af8e41c980604832ec9c708 --- /dev/null +++ b/lora_mlp_modules_to_save/0.7.1.dev0/adapter_config.json @@ -0,0 +1,30 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "MLP", + "parent_library": "test_regression" + }, + "base_model_name_or_path": null, + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.0, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": [ + "lin1" + ], + "peft_type": "LORA", + "r": 8, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "lin0" + ], + "task_type": null +} \ No newline at end of file diff --git a/lora_mlp_modules_to_save/0.7.1.dev0/adapter_model.safetensors b/lora_mlp_modules_to_save/0.7.1.dev0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..165486bf6166a4e487501b4d70d4ae9f995ac004 --- /dev/null +++ b/lora_mlp_modules_to_save/0.7.1.dev0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c1939cb8cb41a8bb5f05238d37aa77d18d96d1d7a9d3afa6d6ff2d2ef9805ea +size 1528 diff --git a/lora_mlp_modules_to_save/0.7.1.dev0/output.pt b/lora_mlp_modules_to_save/0.7.1.dev0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ff4325eb6753f08e69dcc759248e9d8c13319dd --- /dev/null +++ b/lora_mlp_modules_to_save/0.7.1.dev0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50bcd27616ca78b6a55df1f21901d25ff81b4bcc4b8633e9de5456be9e76ede2 +size 1239 diff --git a/lora_opt-350m/0.7.1.dev0/README.md b/lora_opt-350m/0.7.1.dev0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..3013dbdb5845d0f1c5a91b496b5e83b762946353 --- /dev/null +++ b/lora_opt-350m/0.7.1.dev0/README.md @@ -0,0 +1,204 @@ +--- +library_name: peft +base_model: facebook/opt-350m +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +### Framework versions + +- PEFT 0.7.1.dev0 \ No newline at end of file diff --git a/lora_opt-350m/0.7.1.dev0/adapter_config.json b/lora_opt-350m/0.7.1.dev0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..dde2e701f8025807308da1ce7cb4f722491d082a --- /dev/null +++ b/lora_opt-350m/0.7.1.dev0/adapter_config.json @@ -0,0 +1,29 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "OPTForCausalLM", + "parent_library": "transformers.models.opt.modeling_opt" + }, + "base_model_name_or_path": "facebook/opt-350m", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.0, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "v_proj", + "q_proj" + ], + "task_type": null +} \ No newline at end of file diff --git a/lora_opt-350m/0.7.1.dev0/adapter_model.safetensors b/lora_opt-350m/0.7.1.dev0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4b5a55180d4444d976e7f9fd239c5d68f63a6173 --- /dev/null +++ b/lora_opt-350m/0.7.1.dev0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82751e30bebc19cbfa01212631d08c7032fc3a75996dadf4da1d29298fdd736f +size 3159096 diff --git a/lora_opt-350m/0.7.1.dev0/output.pt b/lora_opt-350m/0.7.1.dev0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..729029b97a9a9198394232b754853b7d2fbf602b --- /dev/null +++ b/lora_opt-350m/0.7.1.dev0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:788d8589a3e462ff482ff8926366f18b4bcf9c1d6af2bb1158eff483668645ef +size 1207639 diff --git a/lora_opt-350m_bnb_4bit/0.7.1.dev0/README.md b/lora_opt-350m_bnb_4bit/0.7.1.dev0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..a3db12c59f58680d5f587c674f9c35071779efde --- /dev/null +++ b/lora_opt-350m_bnb_4bit/0.7.1.dev0/README.md @@ -0,0 +1,218 @@ +--- +library_name: peft +base_model: facebook/opt-350m +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +## Training procedure + +The following `bitsandbytes` quantization config was used during training: +- quant_method: bitsandbytes +- load_in_8bit: False +- load_in_4bit: True +- llm_int8_threshold: 6.0 +- llm_int8_skip_modules: None +- llm_int8_enable_fp32_cpu_offload: False +- llm_int8_has_fp16_weight: False +- bnb_4bit_quant_type: fp4 +- bnb_4bit_use_double_quant: False +- bnb_4bit_compute_dtype: float32 + +### Framework versions + +- PEFT 0.7.1.dev0 \ No newline at end of file diff --git a/lora_opt-350m_bnb_4bit/0.7.1.dev0/adapter_config.json b/lora_opt-350m_bnb_4bit/0.7.1.dev0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..dde2e701f8025807308da1ce7cb4f722491d082a --- /dev/null +++ b/lora_opt-350m_bnb_4bit/0.7.1.dev0/adapter_config.json @@ -0,0 +1,29 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "OPTForCausalLM", + "parent_library": "transformers.models.opt.modeling_opt" + }, + "base_model_name_or_path": "facebook/opt-350m", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.0, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "v_proj", + "q_proj" + ], + "task_type": null +} \ No newline at end of file diff --git a/lora_opt-350m_bnb_4bit/0.7.1.dev0/adapter_model.safetensors b/lora_opt-350m_bnb_4bit/0.7.1.dev0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f87f3c2cced2e4736aa0481a818067ffa1b64558 --- /dev/null +++ b/lora_opt-350m_bnb_4bit/0.7.1.dev0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ece009e7ac28447a45cef4a37c5a4a0048b5a5b12261e37464fa762771b94a86 +size 3159096 diff --git a/lora_opt-350m_bnb_4bit/0.7.1.dev0/output.pt b/lora_opt-350m_bnb_4bit/0.7.1.dev0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7a1439eddc2a07109be26dbf66b9096c9855690 --- /dev/null +++ b/lora_opt-350m_bnb_4bit/0.7.1.dev0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00942ada33ef2fcbe9621268e1cce8c59aeeb71dd1c79101498d00c1881f07f5 +size 1207639 diff --git a/lora_opt-350m_bnb_8bit/0.7.1.dev0/README.md b/lora_opt-350m_bnb_8bit/0.7.1.dev0/README.md new file mode 100644 index 0000000000000000000000000000000000000000..3f0e497f64c92a7d1afb2e9d1bf0cbfeb4325896 --- /dev/null +++ b/lora_opt-350m_bnb_8bit/0.7.1.dev0/README.md @@ -0,0 +1,218 @@ +--- +library_name: peft +base_model: facebook/opt-350m +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] + + +## Training procedure + +The following `bitsandbytes` quantization config was used during training: +- quant_method: bitsandbytes +- load_in_8bit: True +- load_in_4bit: False +- llm_int8_threshold: 6.0 +- llm_int8_skip_modules: None +- llm_int8_enable_fp32_cpu_offload: False +- llm_int8_has_fp16_weight: False +- bnb_4bit_quant_type: fp4 +- bnb_4bit_use_double_quant: False +- bnb_4bit_compute_dtype: float32 + +### Framework versions + +- PEFT 0.7.1.dev0 \ No newline at end of file diff --git a/lora_opt-350m_bnb_8bit/0.7.1.dev0/adapter_config.json b/lora_opt-350m_bnb_8bit/0.7.1.dev0/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..dde2e701f8025807308da1ce7cb4f722491d082a --- /dev/null +++ b/lora_opt-350m_bnb_8bit/0.7.1.dev0/adapter_config.json @@ -0,0 +1,29 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "OPTForCausalLM", + "parent_library": "transformers.models.opt.modeling_opt" + }, + "base_model_name_or_path": "facebook/opt-350m", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": false, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.0, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "v_proj", + "q_proj" + ], + "task_type": null +} \ No newline at end of file diff --git a/lora_opt-350m_bnb_8bit/0.7.1.dev0/adapter_model.safetensors b/lora_opt-350m_bnb_8bit/0.7.1.dev0/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f87f3c2cced2e4736aa0481a818067ffa1b64558 --- /dev/null +++ b/lora_opt-350m_bnb_8bit/0.7.1.dev0/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ece009e7ac28447a45cef4a37c5a4a0048b5a5b12261e37464fa762771b94a86 +size 3159096 diff --git a/lora_opt-350m_bnb_8bit/0.7.1.dev0/output.pt b/lora_opt-350m_bnb_8bit/0.7.1.dev0/output.pt new file mode 100644 index 0000000000000000000000000000000000000000..36676c3eefb35372764e496e4df865dc1b3a1e97 --- /dev/null +++ b/lora_opt-350m_bnb_8bit/0.7.1.dev0/output.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1293fc3f775524733cbbc0febbba2e309af29451c8381c65b1057dbfb64a6dd3 +size 604375