From e7e61cc46df325b543098e3fd7dc37902b55b215 Mon Sep 17 00:00:00 2001 From: Arnaud J Le Hors Date: Wed, 27 Nov 2024 09:13:43 +0100 Subject: [PATCH] Latest batch of model updates Signed-off-by: Arnaud J Le Hors --- models/Aquila-VL-2B.yml | 117 ++++++++++++++++++++++++++++++++++++ models/Jiang-Base.yml | 117 ++++++++++++++++++++++++++++++++++++ models/Jurassic-1-Jumbo.yml | 116 +++++++++++++++++++++++++++++++++++ models/MiniCPM3-4B.yml | 116 +++++++++++++++++++++++++++++++++++ "models/PanGu-\316\261.yml" | 116 +++++++++++++++++++++++++++++++++++ models/StellarX-4B-V0.yml | 117 ++++++++++++++++++++++++++++++++++++ 6 files changed, 699 insertions(+) create mode 100644 models/Aquila-VL-2B.yml create mode 100644 models/Jiang-Base.yml create mode 100644 models/Jurassic-1-Jumbo.yml create mode 100644 models/MiniCPM3-4B.yml create mode 100644 "models/PanGu-\316\261.yml" create mode 100644 models/StellarX-4B-V0.yml diff --git a/models/Aquila-VL-2B.yml b/models/Aquila-VL-2B.yml new file mode 100644 index 0000000..3248749 --- /dev/null +++ b/models/Aquila-VL-2B.yml @@ -0,0 +1,117 @@ +framework: + name: 'Model Openness Framework' + version: '1.0' + date: '2024-12-15' +release: + name: Aquila-VL-2B + version: 2.18B + date: '2024-11-22' + type: multimodal + architecture: 'transformer decoder' + origin: 'Qwen2.5-1.5B-instruct' + producer: 'Beijing Academy of Artificial Intelligence(BAAI)' + contact: 403969556@qq.com + huggingface: 'https://huggingface.co/BAAI/Aquila-VL-2B-llava-qwen' + components: + - + name: 'Model architecture' + description: "Well commented code for the model's architecture" + location: 'https://huggingface.co/Qwen/Qwen2.5-1.5B-Instruct' + license_name: Apache-2.0 + license_path: 'https://huggingface.co/Qwen/Qwen2.5-1.5B-Instruct/blob/main/LICENSE' + - + name: 'Data preprocessing code' + description: 'Code for data cleansing, normalization, and augmentation' + location: 
'https://huggingface.co/datasets/BAAI/Infinity-MM/tree/main/preprocessing' + license_name: Apache-2.0 + license_path: 'https://huggingface.co/datasets/choosealicense/licenses/blob/main/markdown/apache-2.0.md' + - + name: 'Training code' + description: 'Code used for training the model' + location: 'https://github.com/LLaVA-VL/LLaVA-NeXT' + license_name: Apache-2.0 + license_path: 'https://github.com/LLaVA-VL/LLaVA-NeXT?tab=Apache-2.0-1-ov-file' + - + name: 'Inference code' + description: 'Code used for running the model to make predictions' + location: 'https://github.com/LLaVA-VL/LLaVA-NeXT' + license_name: Apache-2.0 + license_path: 'https://github.com/LLaVA-VL/LLaVA-NeXT?tab=Apache-2.0-1-ov-file' + - + name: 'Evaluation code' + description: 'Code used for evaluating the model' + location: 'https://github.com/open-compass/VLMEvalKit?tab=Apache-2.0-1-ov-file' + license_name: Apache-2.0 + license_path: 'https://github.com/open-compass/VLMEvalKit?tab=Apache-2.0-1-ov-file' + - + name: 'Supporting libraries and tools' + description: "Libraries and tools used in the model's development" + location: 'https://github.com/huggingface/transformers' + license_name: Apache-2.0 + license_path: 'https://github.com/huggingface/transformers?tab=Apache-2.0-1-ov-file' + - + name: 'Model parameters (Final)' + description: 'Trained model parameters, weights and biases' + location: 'https://huggingface.co/BAAI/Aquila-VL-2B-llava-qwen' + license_name: Apache-2.0 + license_path: 'https://huggingface.co/datasets/choosealicense/licenses/blob/main/markdown/apache-2.0.md' + - + name: 'Model parameters (Intermediate)' + description: 'Trained model parameters, weights and biases' + location: 'https://huggingface.co/BAAI/Aquila-VL-2B-Intermediate' + license_name: CDLA-Permissive-2.0 + license_path: 'https://huggingface.co/datasets/choosealicense/licenses/blob/main/markdown/apache-2.0.md' + - + name: Datasets + description: 'Training, validation and testing datasets used for the model' + 
location: 'https://huggingface.co/datasets/BAAI/Infinity-MM' + license_name: CC-BY-4.0 + license_path: 'https://choosealicense.com/licenses/cc-by-sa-4.0/' + - + name: 'Evaluation data' + description: 'Data used for evaluating the model' + location: 'https://github.com/open-compass/VLMEvalKit?tab=Apache-2.0-1-ov-file' + license_name: CDLA-Permissive-2.0 + license_path: 'https://github.com/open-compass/VLMEvalKit?tab=Apache-2.0-1-ov-file' + - + name: 'Model metadata' + description: 'Any model metadata including training configuration and optimizer states' + location: '' + license_name: 'Component not included' + license_path: '' + - + name: 'Sample model outputs' + description: 'Examples of outputs generated by the model' + location: '' + license_name: 'Component not included' + license_path: '' + - + name: 'Model card' + description: 'Model details including performance metrics, intended use, and limitations' + location: 'https://huggingface.co/BAAI/Aquila-VL-2B-llava-qwen' + license_name: Apache-2.0 + license_path: 'https://choosealicense.com/licenses/apache-2.0/' + - + name: 'Data card' + description: 'Documentation for datasets including source, characteristics, and preprocessing details' + location: 'https://huggingface.co/datasets/BAAI/Infinity-MM' + license_name: CC-BY-4.0 + license_path: 'https://choosealicense.com/licenses/cc-by-sa-4.0/' + - + name: 'Technical report' + description: 'Technical report detailing capabilities and usage instructions for the model' + location: 'https://arxiv.org/abs/2410.18558' + license_name: CC-BY-4.0 + license_path: 'https://creativecommons.org/licenses/by/4.0/' + - + name: 'Research paper' + description: 'Research paper detailing the development and capabilities of the model' + location: 'https://arxiv.org/abs/2410.18558' + license_name: CC-BY-4.0 + license_path: 'https://creativecommons.org/licenses/by/4.0/' + - + name: 'Evaluation results' + description: 'The results from evaluating the model' + location: 
'https://huggingface.co/BAAI/Aquila-VL-2B-llava-qwen' + license_name: Apache-2.0 + license_path: 'https://choosealicense.com/licenses/apache-2.0/' diff --git a/models/Jiang-Base.yml b/models/Jiang-Base.yml new file mode 100644 index 0000000..4f72206 --- /dev/null +++ b/models/Jiang-Base.yml @@ -0,0 +1,117 @@ +framework: + name: 'Model Openness Framework' + version: '1.0' + date: '2024-12-15' +release: + name: Jiang-Base + version: 30B + date: '2024-11-14' + type: language + architecture: 'transformer decoder' + origin: '' + producer: KDF + contact: '' + huggingface: 'https://huggingface.co/kdf/jiang-base' + components: + - + name: 'Model architecture' + description: "Well commented code for the model's architecture" + location: '' + license_name: 'Component Not Included' + license_path: '' + - + name: 'Data preprocessing code' + description: 'Code for data cleansing, normalization, and augmentation' + location: '' + license_name: 'Component Not Included' + license_path: '' + - + name: 'Training code' + description: 'Code used for training the model' + location: '' + license_name: 'Component Not Included' + license_path: '' + - + name: 'Inference code' + description: 'Code used for running the model to make predictions' + location: '' + license_name: Apache-2.0 + license_path: '' + - + name: 'Evaluation code' + description: 'Code used for evaluating the model' + location: '' + license_name: 'Component Not Included' + license_path: '' + - + name: 'Supporting libraries and tools' + description: "Libraries and tools used in the model's development" + location: '' + license_name: 'Component Not Included' + license_path: '' + - + name: 'Model parameters (Final)' + description: 'Trained model parameters, weights and biases' + location: '' + license_name: 'License not specified' + license_path: '' + - + name: 'Model parameters (Intermediate)' + description: 'Trained model parameters, weights and biases' + location: '' + license_name: 'Component Not Included' + 
license_path: '' + - + name: Datasets + description: 'Training, validation and testing datasets used for the model' + location: '' + license_name: 'License not specified' + license_path: '' + - + name: 'Evaluation data' + description: 'Data used for evaluating the model' + location: '' + license_name: 'Component Not Included' + license_path: '' + - + name: 'Model metadata' + description: 'Any model metadata including training configuration and optimizer states' + location: '' + license_name: 'Component Not Included' + license_path: '' + - + name: 'Sample model outputs' + description: 'Examples of outputs generated by the model' + location: '' + license_name: 'Component Not Included' + license_path: '' + - + name: 'Model card' + description: 'Model details including performance metrics, intended use, and limitations' + location: '' + license_name: 'License not specified' + license_path: '' + - + name: 'Data card' + description: 'Documentation for datasets including source, characteristics, and preprocessing details' + location: '' + license_name: 'Component Not Included' + license_path: '' + - + name: 'Technical report' + description: 'Technical report detailing capabilities and usage instructions for the model' + location: '' + license_name: 'Component Not Included' + license_path: '' + - + name: 'Research paper' + description: 'Research paper detailing the development and capabilities of the model' + location: '' + license_name: 'License not specified' + license_path: '' + - + name: 'Evaluation results' + description: 'The results from evaluating the model' + location: '' + license_name: 'License not specified' + license_path: '' diff --git a/models/Jurassic-1-Jumbo.yml b/models/Jurassic-1-Jumbo.yml new file mode 100644 index 0000000..2363461 --- /dev/null +++ b/models/Jurassic-1-Jumbo.yml @@ -0,0 +1,116 @@ +framework: + name: 'Model Openness Framework' + version: '1.0' + date: '2024-12-15' +release: + name: Jurassic-1-Jumbo + version: 178B + date: '2024-11-14' + 
type: language + architecture: 'transformer decoder' + origin: '' + producer: 'AI21 Labs' + contact: '' + components: + - + name: 'Model architecture' + description: "Well commented code for the model's architecture" + location: '' + license_name: 'License not specified' + license_path: '' + - + name: 'Data preprocessing code' + description: 'Code for data cleansing, normalization, and augmentation' + location: '' + license_name: 'Component Not Included' + license_path: '' + - + name: 'Training code' + description: 'Code used for training the model' + location: '' + license_name: 'Component Not Included' + license_path: '' + - + name: 'Inference code' + description: 'Code used for running the model to make predictions' + location: '' + license_name: 'Component Not Included' + license_path: '' + - + name: 'Evaluation code' + description: 'Code used for evaluating the model' + location: '' + license_name: 'License not specified' + license_path: '' + - + name: 'Supporting libraries and tools' + description: "Libraries and tools used in the model's development" + location: '' + license_name: 'Component Not Included' + license_path: '' + - + name: 'Model parameters (Final)' + description: 'Trained model parameters, weights and biases' + location: '' + license_name: 'Component Not Included' + license_path: '' + - + name: 'Model parameters (Intermediate)' + description: 'Trained model parameters, weights and biases' + location: '' + license_name: 'Component Not Included' + license_path: '' + - + name: Datasets + description: 'Training, validation and testing datasets used for the model' + location: '' + license_name: 'License not specified' + license_path: '' + - + name: 'Evaluation data' + description: 'Data used for evaluating the model' + location: '' + license_name: 'Component Not Included' + license_path: '' + - + name: 'Model metadata' + description: 'Any model metadata including training configuration and optimizer states' + location: '' + license_name: 'Component 
Not Included' + license_path: '' + - + name: 'Sample model outputs' + description: 'Examples of outputs generated by the model' + location: '' + license_name: 'Component Not Included' + license_path: '' + - + name: 'Model card' + description: 'Model details including performance metrics, intended use, and limitations' + location: '' + license_name: 'Component Not Included' + license_path: '' + - + name: 'Data card' + description: 'Documentation for datasets including source, characteristics, and preprocessing details' + location: '' + license_name: 'Component Not Included' + license_path: '' + - + name: 'Technical report' + description: 'Technical report detailing capabilities and usage instructions for the model' + location: '' + license_name: 'Component Not Included' + license_path: '' + - + name: 'Research paper' + description: 'Research paper detailing the development and capabilities of the model' + location: '' + license_name: 'License not specified' + license_path: '' + - + name: 'Evaluation results' + description: 'The results from evaluating the model' + location: '' + license_name: 'License not specified' + license_path: '' diff --git a/models/MiniCPM3-4B.yml b/models/MiniCPM3-4B.yml new file mode 100644 index 0000000..7f893c0 --- /dev/null +++ b/models/MiniCPM3-4B.yml @@ -0,0 +1,116 @@ +framework: + name: 'Model Openness Framework' + version: '1.0' + date: '2024-12-15' +release: + name: 'MiniCPM3-4B' + version: 4B + date: '2024-11-14' + type: language + architecture: decoder + origin: '' + producer: OpenBMB + contact: '' + components: + - + name: 'Model architecture' + description: "Well commented code for the model's architecture" + location: '' + license_name: 'License not specified' + license_path: '' + - + name: 'Data preprocessing code' + description: 'Code for data cleansing, normalization, and augmentation' + location: '' + license_name: 'Component not included' + license_path: '' + - + name: 'Training code' + description: 'Code used for training 
the model' + location: '' + license_name: 'Component not included' + license_path: '' + - + name: 'Inference code' + description: 'Code used for running the model to make predictions' + location: '' + license_name: Apache-2.0 + license_path: '' + - + name: 'Evaluation code' + description: 'Code used for evaluating the model' + location: '' + license_name: 'Component not included' + license_path: '' + - + name: 'Supporting libraries and tools' + description: "Libraries and tools used in the model's development" + location: '' + license_name: Apache-2.0 + license_path: '' + - + name: 'Model parameters (Final)' + description: 'Trained model parameters, weights and biases' + location: '' + license_name: 'Component not included' + license_path: '' + - + name: 'Model parameters (Intermediate)' + description: 'Trained model parameters, weights and biases' + location: '' + license_name: 'Component not included' + license_path: '' + - + name: Datasets + description: 'Training, validation and testing datasets used for the model' + location: '' + license_name: 'Component not included' + license_path: '' + - + name: 'Evaluation data' + description: 'Data used for evaluating the model' + location: '' + license_name: 'Component not included' + license_path: '' + - + name: 'Model metadata' + description: 'Any model metadata including training configuration and optimizer states' + location: '' + license_name: 'Component not included' + license_path: '' + - + name: 'Sample model outputs' + description: 'Examples of outputs generated by the model' + location: '' + license_name: 'Component not included' + license_path: '' + - + name: 'Model card' + description: 'Model details including performance metrics, intended use, and limitations' + location: '' + license_name: 'License not specified' + license_path: '' + - + name: 'Data card' + description: 'Documentation for datasets including source, characteristics, and preprocessing details' + location: '' + license_name: 'Component not 
included' + license_path: '' + - + name: 'Technical report' + description: 'Technical report detailing capabilities and usage instructions for the model' + location: '' + license_name: 'License not specified' + license_path: '' + - + name: 'Research paper' + description: 'Research paper detailing the development and capabilities of the model' + location: '' + license_name: 'License not specified' + license_path: '' + - + name: 'Evaluation results' + description: 'The results from evaluating the model' + location: '' + license_name: 'License not specified' + license_path: '' diff --git "a/models/PanGu-\316\261.yml" "b/models/PanGu-\316\261.yml" new file mode 100644 index 0000000..2df326b --- /dev/null +++ "b/models/PanGu-\316\261.yml" @@ -0,0 +1,116 @@ +framework: + name: 'Model Openness Framework' + version: '1.0' + date: '2024-12-15' +release: + name: PanGu-α + version: 200B + date: '2024-11-14' + type: language + architecture: decoder + origin: '' + producer: Huawei + contact: '' + components: + - + name: 'Model architecture' + description: "Well commented code for the model's architecture" + location: '' + license_name: 'Pending evaluation' + license_path: '' + - + name: 'Data preprocessing code' + description: 'Code for data cleansing, normalization, and augmentation' + location: '' + license_name: 'Pending evaluation' + license_path: '' + - + name: 'Training code' + description: 'Code used for training the model' + location: '' + license_name: 'Pending evaluation' + license_path: '' + - + name: 'Inference code' + description: 'Code used for running the model to make predictions' + location: '' + license_name: 'Pending evaluation' + license_path: '' + - + name: 'Evaluation code' + description: 'Code used for evaluating the model' + location: '' + license_name: 'Pending evaluation' + license_path: '' + - + name: 'Supporting libraries and tools' + description: "Libraries and tools used in the model's development" + location: '' + license_name: 'Pending 
evaluation' + license_path: '' + - + name: 'Model parameters (Final)' + description: 'Trained model parameters, weights and biases' + location: '' + license_name: 'Pending evaluation' + license_path: '' + - + name: 'Model parameters (Intermediate)' + description: 'Trained model parameters, weights and biases' + location: '' + license_name: 'Pending evaluation' + license_path: '' + - + name: Datasets + description: 'Training, validation and testing datasets used for the model' + location: '' + license_name: 'Pending evaluation' + license_path: '' + - + name: 'Evaluation data' + description: 'Data used for evaluating the model' + location: '' + license_name: 'Pending evaluation' + license_path: '' + - + name: 'Model metadata' + description: 'Any model metadata including training configuration and optimizer states' + location: '' + license_name: 'Pending evaluation' + license_path: '' + - + name: 'Sample model outputs' + description: 'Examples of outputs generated by the model' + location: '' + license_name: 'Pending evaluation' + license_path: '' + - + name: 'Model card' + description: 'Model details including performance metrics, intended use, and limitations' + location: '' + license_name: 'Pending evaluation' + license_path: '' + - + name: 'Data card' + description: 'Documentation for datasets including source, characteristics, and preprocessing details' + location: '' + license_name: 'Pending evaluation' + license_path: '' + - + name: 'Technical report' + description: 'Technical report detailing capabilities and usage instructions for the model' + location: '' + license_name: 'Pending evaluation' + license_path: '' + - + name: 'Research paper' + description: 'Research paper detailing the development and capabilities of the model' + location: '' + license_name: 'License not specified' + license_path: '' + - + name: 'Evaluation results' + description: 'The results from evaluating the model' + location: '' + license_name: 'Pending evaluation' + license_path: '' diff 
--git a/models/StellarX-4B-V0.yml b/models/StellarX-4B-V0.yml new file mode 100644 index 0000000..1a4b961 --- /dev/null +++ b/models/StellarX-4B-V0.yml @@ -0,0 +1,117 @@ +framework: + name: 'Model Openness Framework' + version: '1.0' + date: '2024-12-15' +release: + name: StellarX-4B-V0 + version: 4B + date: '2024-11-14' + type: '' + architecture: decoder + origin: StellarX-4B-V0 + producer: 'Dampish, Arkane Industries' + contact: '' + huggingface: 'https://huggingface.co/Dampish/StellarX-4B-V0' + components: + - + name: 'Model architecture' + description: "Well commented code for the model's architecture" + location: '' + license_name: 'Component not included' + license_path: '' + - + name: 'Data preprocessing code' + description: 'Code for data cleansing, normalization, and augmentation' + location: '' + license_name: 'Component not included' + license_path: '' + - + name: 'Training code' + description: 'Code used for training the model' + location: '' + license_name: 'Component not included' + license_path: '' + - + name: 'Inference code' + description: 'Code used for running the model to make predictions' + location: '' + license_name: 'commercial use restrictions; CC-BY-NC-SA-4.0' + license_path: '' + - + name: 'Evaluation code' + description: 'Code used for evaluating the model' + location: '' + license_name: 'Component not included' + license_path: '' + - + name: 'Supporting libraries and tools' + description: "Libraries and tools used in the model's development" + location: '' + license_name: 'License not specified' + license_path: '' + - + name: 'Model parameters (Final)' + description: 'Trained model parameters, weights and biases' + location: '' + license_name: 'Component not included' 
+ license_path: '' + - + name: 'Model parameters (Intermediate)' + description: 'Trained model parameters, weights and biases' + location: '' + license_name: 'Component not included' + license_path: '' + - + name: Datasets + description: 'Training, validation and testing datasets used for the model' + location: '' + license_name: 'License not specified' + license_path: '' + - + name: 'Evaluation data' + description: 'Data used for evaluating the model' + location: '' + license_name: 'Component not included' + license_path: '' + - + name: 'Model metadata' + description: 'Any model metadata including training configuration and optimizer states' + location: '' + license_name: 'License not specified' + license_path: '' + - + name: 'Sample model outputs' + description: 'Examples of outputs generated by the model' + location: '' + license_name: 'Component not included' + license_path: '' + - + name: 'Model card' + description: 'Model details including performance metrics, intended use, and limitations' + location: '' + license_name: 'License not specified' + license_path: '' + - + name: 'Data card' + description: 'Documentation for datasets including source, characteristics, and preprocessing details' + location: '' + license_name: 'License not specified' + license_path: '' + - + name: 'Technical report' + description: 'Technical report detailing capabilities and usage instructions for the model' + location: '' + license_name: 'License not specified' + license_path: '' + - + name: 'Research paper' + description: 'Research paper detailing the development and capabilities of the model' + location: '' + license_name: 'License not specified' + license_path: '' + - + name: 'Evaluation results' + description: 'The results from evaluating the model' + location: '' + license_name: 'License not specified' + license_path: ''