diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-100/README.md b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-100/README.md new file mode 100644 index 0000000000000000000000000000000000000000..62416b37ed9e5040f71c81b7df78b7cc4f978ac9 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-100/README.md @@ -0,0 +1,202 @@ +--- +base_model: /share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.13.2 \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-100/adapter_config.json b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-100/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1044f62e37b2504f1f866e908e43fcad6e9bab4f --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-100/adapter_config.json @@ -0,0 +1,31 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "/share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 16, + "lora_dropout": 0.05, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 64, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "c_attn", + "attn.c_proj", + "w1", + "w2" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-100/adapter_model.safetensors b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-100/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b61533ae24c8449531a8daeed4a90e6d5b43f92f --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-100/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1578c865726923bb16dd42af5ec1787782bd71c3e9ed341694de61739ebc2c81 +size 448823864 diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-1000/README.md b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-1000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..62416b37ed9e5040f71c81b7df78b7cc4f978ac9 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-1000/README.md @@ -0,0 +1,202 @@ +--- +base_model: /share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.13.2 \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-1000/adapter_config.json b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-1000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1044f62e37b2504f1f866e908e43fcad6e9bab4f --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-1000/adapter_config.json @@ -0,0 +1,31 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "/share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 16, + "lora_dropout": 0.05, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 64, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "c_attn", + "attn.c_proj", + "w1", + "w2" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-1000/adapter_model.safetensors b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-1000/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6972fc33430b0811eeeb98d198986f786307c937 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-1000/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:940b6de56409177e43a86bda6b6f4a99925b931ed8e7b2d24454561bea4ba0a8 +size 448823864 diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-150/README.md b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-150/README.md new file mode 100644 index 0000000000000000000000000000000000000000..62416b37ed9e5040f71c81b7df78b7cc4f978ac9 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-150/README.md @@ -0,0 +1,202 @@ +--- +base_model: /share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.13.2 \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-150/adapter_config.json b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-150/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1044f62e37b2504f1f866e908e43fcad6e9bab4f --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-150/adapter_config.json @@ -0,0 +1,31 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "/share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 16, + "lora_dropout": 0.05, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 64, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "c_attn", + "attn.c_proj", + "w1", + "w2" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-150/adapter_model.safetensors b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-150/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a9c4118fc1ef7f2c21154d858ff72706959474c7 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-150/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d600e73f45adc21d4f18133beb4c9c00da5d17197f7cc0f2e4cc535647a1dec0 +size 448823864 diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-200/README.md b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-200/README.md new file mode 100644 index 0000000000000000000000000000000000000000..62416b37ed9e5040f71c81b7df78b7cc4f978ac9 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-200/README.md @@ -0,0 +1,202 @@ +--- +base_model: /share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.13.2 \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-200/adapter_config.json b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-200/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1044f62e37b2504f1f866e908e43fcad6e9bab4f --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-200/adapter_config.json @@ -0,0 +1,31 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "/share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 16, + "lora_dropout": 0.05, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 64, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "c_attn", + "attn.c_proj", + "w1", + "w2" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-200/adapter_model.safetensors b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-200/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1b2b07e0be788e416892a1b996a2edfb9c6d0945 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-200/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d9e9b1fc8ce6f6968c0d4372723107e5c46c6370ca65c67e56c0077bc407426 +size 448823864 diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-250/README.md b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-250/README.md new file mode 100644 index 0000000000000000000000000000000000000000..62416b37ed9e5040f71c81b7df78b7cc4f978ac9 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-250/README.md @@ -0,0 +1,202 @@ +--- +base_model: /share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.13.2 \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-250/adapter_config.json b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-250/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1044f62e37b2504f1f866e908e43fcad6e9bab4f --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-250/adapter_config.json @@ -0,0 +1,31 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "/share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 16, + "lora_dropout": 0.05, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 64, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "c_attn", + "attn.c_proj", + "w1", + "w2" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-250/adapter_model.safetensors b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-250/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d21a2e3b7edd2c465f03197eda2fe2bf09da9bbc --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-250/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:184cc8940ce05fd19d2f72559358cdc036cdbbc80396c952d8197ee1bb25f136 +size 448823864 diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-300/README.md b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-300/README.md new file mode 100644 index 0000000000000000000000000000000000000000..62416b37ed9e5040f71c81b7df78b7cc4f978ac9 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-300/README.md @@ -0,0 +1,202 @@ +--- +base_model: /share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.13.2 \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-300/adapter_config.json b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-300/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1044f62e37b2504f1f866e908e43fcad6e9bab4f --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-300/adapter_config.json @@ -0,0 +1,31 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "/share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 16, + "lora_dropout": 0.05, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 64, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "c_attn", + "attn.c_proj", + "w1", + "w2" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-300/adapter_model.safetensors b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-300/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e417c997a55bdb8d52579e1c423158b1d341e80e --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-300/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:186993e11d81596ddd06f6f864dd053f5d673f78182b2b0fdd646f5c96070010 +size 448823864 diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-350/README.md b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-350/README.md new file mode 100644 index 0000000000000000000000000000000000000000..62416b37ed9e5040f71c81b7df78b7cc4f978ac9 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-350/README.md @@ -0,0 +1,202 @@ +--- +base_model: /share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.13.2 \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-350/adapter_config.json b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-350/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1044f62e37b2504f1f866e908e43fcad6e9bab4f --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-350/adapter_config.json @@ -0,0 +1,31 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "/share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 16, + "lora_dropout": 0.05, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 64, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "c_attn", + "attn.c_proj", + "w1", + "w2" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-350/adapter_model.safetensors b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-350/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4909bd0d916d16318637fea47f91e01d14570021 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-350/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:848aff0938546a62f20b5cb9727db2eb08132e442a2945dc225b463d05ff7163 +size 448823864 diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-400/README.md b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-400/README.md new file mode 100644 index 0000000000000000000000000000000000000000..62416b37ed9e5040f71c81b7df78b7cc4f978ac9 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-400/README.md @@ -0,0 +1,202 @@ +--- +base_model: /share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.13.2 \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-400/adapter_config.json b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-400/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1044f62e37b2504f1f866e908e43fcad6e9bab4f --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-400/adapter_config.json @@ -0,0 +1,31 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "/share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 16, + "lora_dropout": 0.05, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 64, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "c_attn", + "attn.c_proj", + "w1", + "w2" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-400/adapter_model.safetensors b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-400/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..37b8b5c7a9c5e731c042af3619ad6ce09d959b0b --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-400/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:054294d39abc70d9ae83cda933762c2a2af45eea563628cb32ad7e61bd0b398e +size 448823864 diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-450/README.md b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-450/README.md new file mode 100644 index 0000000000000000000000000000000000000000..62416b37ed9e5040f71c81b7df78b7cc4f978ac9 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-450/README.md @@ -0,0 +1,202 @@ +--- +base_model: /share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.13.2 \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-450/adapter_config.json b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-450/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1044f62e37b2504f1f866e908e43fcad6e9bab4f --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-450/adapter_config.json @@ -0,0 +1,31 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "/share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 16, + "lora_dropout": 0.05, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 64, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "c_attn", + "attn.c_proj", + "w1", + "w2" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-450/adapter_model.safetensors b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-450/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b2012355946e7be85f53b69b3e3ca38ddce98a20 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-450/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1147d57c474b2f5f3bc9bfe8bb9e3cfa38c6f16950888485939dc94dfc6685d7 +size 448823864 diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-50/README.md b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-50/README.md new file mode 100644 index 0000000000000000000000000000000000000000..62416b37ed9e5040f71c81b7df78b7cc4f978ac9 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-50/README.md @@ -0,0 +1,202 @@ +--- +base_model: /share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.13.2 \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-50/adapter_config.json b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-50/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1044f62e37b2504f1f866e908e43fcad6e9bab4f --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-50/adapter_config.json @@ -0,0 +1,31 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "/share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 16, + "lora_dropout": 0.05, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 64, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "c_attn", + "attn.c_proj", + "w1", + "w2" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-50/adapter_model.safetensors b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-50/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3ee3d1f1adbd421637537b90bcdaad309496a71b --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-50/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c3a233e0dfa54892146ee389d23109bfee5cd0f5df7d7bd1bc3a0db428d0fba +size 448823864 diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-500/README.md b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-500/README.md new file mode 100644 index 0000000000000000000000000000000000000000..62416b37ed9e5040f71c81b7df78b7cc4f978ac9 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-500/README.md @@ -0,0 +1,202 @@ +--- +base_model: /share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.13.2 \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-500/adapter_config.json b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-500/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1044f62e37b2504f1f866e908e43fcad6e9bab4f --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-500/adapter_config.json @@ -0,0 +1,31 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "/share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 16, + "lora_dropout": 0.05, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 64, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "c_attn", + "attn.c_proj", + "w1", + "w2" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-500/adapter_model.safetensors b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-500/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8cabd834cbe6e81fc7963f2ccad1bfda5af9cb6f --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-500/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aded28d9ebb22b51295344a2ead9adff806843f64e8f18525079e5d0faff7d17 +size 448823864 diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-550/README.md b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-550/README.md new file mode 100644 index 0000000000000000000000000000000000000000..62416b37ed9e5040f71c81b7df78b7cc4f978ac9 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-550/README.md @@ -0,0 +1,202 @@ +--- +base_model: /share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.13.2 \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-550/adapter_config.json b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-550/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1044f62e37b2504f1f866e908e43fcad6e9bab4f --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-550/adapter_config.json @@ -0,0 +1,31 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "/share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 16, + "lora_dropout": 0.05, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 64, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "c_attn", + "attn.c_proj", + "w1", + "w2" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-550/adapter_model.safetensors b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-550/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e1cea4769364df5a1d014b4f40cacfc7a76fa300 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-550/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:933f3718db6f88b1a68c82201e3fb9a20cd0d3cea60e04e391446884719e0039 +size 448823864 diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-600/README.md b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-600/README.md new file mode 100644 index 0000000000000000000000000000000000000000..62416b37ed9e5040f71c81b7df78b7cc4f978ac9 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-600/README.md @@ -0,0 +1,202 @@ +--- +base_model: /share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.13.2 \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-600/adapter_config.json b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-600/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1044f62e37b2504f1f866e908e43fcad6e9bab4f --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-600/adapter_config.json @@ -0,0 +1,31 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "/share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 16, + "lora_dropout": 0.05, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 64, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "c_attn", + "attn.c_proj", + "w1", + "w2" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-600/adapter_model.safetensors b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-600/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2fcacb3855366e35614a93d0714cc9ba2afdab40 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-600/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c23ab300efaa5a3ed1b4611154aa7c7cf779587361f8445f265e2d5e9b27aa29 +size 448823864 diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-650/README.md b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-650/README.md new file mode 100644 index 0000000000000000000000000000000000000000..62416b37ed9e5040f71c81b7df78b7cc4f978ac9 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-650/README.md @@ -0,0 +1,202 @@ +--- +base_model: /share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.13.2 \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-650/adapter_config.json b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-650/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1044f62e37b2504f1f866e908e43fcad6e9bab4f --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-650/adapter_config.json @@ -0,0 +1,31 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "/share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 16, + "lora_dropout": 0.05, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 64, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "c_attn", + "attn.c_proj", + "w1", + "w2" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-650/adapter_model.safetensors b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-650/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..de27a60ce68bee74f4f1b9e500498d50538f1e9f --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-650/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21313cd4e34f6be84021da88acc271fb20c97e01bc5d93d1fbca78c056497a76 +size 448823864 diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-700/README.md b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-700/README.md new file mode 100644 index 0000000000000000000000000000000000000000..62416b37ed9e5040f71c81b7df78b7cc4f978ac9 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-700/README.md @@ -0,0 +1,202 @@ +--- +base_model: /share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.13.2 \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-700/adapter_config.json b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-700/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1044f62e37b2504f1f866e908e43fcad6e9bab4f --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-700/adapter_config.json @@ -0,0 +1,31 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "/share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 16, + "lora_dropout": 0.05, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 64, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "c_attn", + "attn.c_proj", + "w1", + "w2" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-700/adapter_model.safetensors b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-700/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f7e74fc65f0201742f6be2d334c2bb2bfa6b50d0 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-700/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71f9668a24d536dfc150e530bccd31039ae49c9f6f2ad43e212bbcf551b15c1a +size 448823864 diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-750/README.md b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-750/README.md new file mode 100644 index 0000000000000000000000000000000000000000..62416b37ed9e5040f71c81b7df78b7cc4f978ac9 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-750/README.md @@ -0,0 +1,202 @@ +--- +base_model: /share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.13.2 \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-750/adapter_config.json b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-750/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1044f62e37b2504f1f866e908e43fcad6e9bab4f --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-750/adapter_config.json @@ -0,0 +1,31 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "/share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 16, + "lora_dropout": 0.05, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 64, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "c_attn", + "attn.c_proj", + "w1", + "w2" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-750/adapter_model.safetensors b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-750/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f19a7d0d36e3e5ef019593a07daf702dd65a7121 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-750/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a115b3ba9024d724b7d4523848098c04e1c82a7c71770f9dcd89c8cd5d960f5 +size 448823864 diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-800/README.md b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-800/README.md new file mode 100644 index 0000000000000000000000000000000000000000..62416b37ed9e5040f71c81b7df78b7cc4f978ac9 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-800/README.md @@ -0,0 +1,202 @@ +--- +base_model: /share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.13.2 \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-800/adapter_config.json b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-800/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1044f62e37b2504f1f866e908e43fcad6e9bab4f --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-800/adapter_config.json @@ -0,0 +1,31 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "/share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 16, + "lora_dropout": 0.05, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 64, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "c_attn", + "attn.c_proj", + "w1", + "w2" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-800/adapter_model.safetensors b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-800/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bf52aa3a6dba0088913747766ff5685c8b67207b --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-800/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80bc6abc9f583f53c341d440fdc3fdc3153815b546582fdc4fe75415e027595b +size 448823864 diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-850/README.md b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-850/README.md new file mode 100644 index 0000000000000000000000000000000000000000..62416b37ed9e5040f71c81b7df78b7cc4f978ac9 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-850/README.md @@ -0,0 +1,202 @@ +--- +base_model: /share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.13.2 \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-850/adapter_config.json b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-850/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1044f62e37b2504f1f866e908e43fcad6e9bab4f --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-850/adapter_config.json @@ -0,0 +1,31 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "/share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 16, + "lora_dropout": 0.05, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 64, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "c_attn", + "attn.c_proj", + "w1", + "w2" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-850/adapter_model.safetensors b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-850/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0fda1c0b924b30e962553e81470373d7958dc97d --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-850/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b37065c91e463a60493e0d25099c028a87484a6e5b00909173b8b266472295e +size 448823864 diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-900/README.md b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-900/README.md new file mode 100644 index 0000000000000000000000000000000000000000..62416b37ed9e5040f71c81b7df78b7cc4f978ac9 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-900/README.md @@ -0,0 +1,202 @@ +--- +base_model: /share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.13.2 \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-900/adapter_config.json b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-900/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1044f62e37b2504f1f866e908e43fcad6e9bab4f --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-900/adapter_config.json @@ -0,0 +1,31 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "/share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 16, + "lora_dropout": 0.05, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 64, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "c_attn", + "attn.c_proj", + "w1", + "w2" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-900/adapter_model.safetensors b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-900/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..44c4094cbefe832448f8fdd7ec4616086f11c481 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-900/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97b70f821884c718636db112b8991d48688727f23c6a3c2a95f880efc3f68d7e +size 448823864 diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-950/README.md b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-950/README.md new file mode 100644 index 0000000000000000000000000000000000000000..62416b37ed9e5040f71c81b7df78b7cc4f978ac9 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-950/README.md @@ -0,0 +1,202 @@ +--- +base_model: /share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.13.2 \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-950/adapter_config.json b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-950/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1044f62e37b2504f1f866e908e43fcad6e9bab4f --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-950/adapter_config.json @@ -0,0 +1,31 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "/share/ssddata/sarimhashmi/mimic_vqa/Qwen-VL-Chat", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 16, + "lora_dropout": 0.05, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 64, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "c_attn", + "attn.c_proj", + "w1", + "w2" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-950/adapter_model.safetensors b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-950/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..67c6b7d0d8478b19e6d4ebbb28a7ed293784ae66 --- /dev/null +++ b/qwenvlceweights/ce_qwen_vl_weights/checkpoint-batch-950/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc098ea627d8dc7e02353ebfc0297227317342099df5e830221013f765c04a69 +size 448823864