Skip to content

Commit cde1228

Browse files
authored
Merge pull request #112 from lehors/update-models
Update models
2 parents 02e7502 + 8c020cb commit cde1228

File tree

6 files changed: 92 additions (+92) and 83 deletions (-83)

models/BLOOM.yml

Lines changed: 28 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -4,41 +4,59 @@ framework:
44
date: '2024-12-15'
55
release:
66
name: BLOOM
7-
version: 176B
8-
date: '2024-11-15'
9-
license: { }
7+
version: 366B
8+
date: '2025-05-10'
109
type: language
1110
architecture: 'transformer decoder'
1211
origin: ''
1312
producer: BigScience
1413
contact: ''
14+
repository: ''
1515
huggingface: 'https://huggingface.co/bigscience/bloom'
16+
license:
17+
distribution:
18+
name: BigScience-BLOOM-RAIL-1.0
19+
path: ''
1620
components:
1721
-
1822
name: 'Model architecture'
1923
description: "Well commented code for the model's architecture"
20-
license: bigscience-bloom-rail-1.0
24+
-
25+
name: 'Training code'
26+
description: 'Code used for training the model'
27+
-
28+
name: 'Inference code'
29+
description: 'Code used for running the model to make predictions'
30+
-
31+
name: 'Evaluation code'
32+
description: 'Code used for evaluating the model'
2133
-
2234
name: 'Model parameters (Final)'
2335
description: 'Trained model parameters, weights and biases'
24-
license: 'BigScience RAIL License v1.0'
36+
-
37+
name: 'Model parameters (Intermediate)'
38+
description: 'Trained model parameters, weights and biases'
2539
-
2640
name: Datasets
2741
description: 'Training, validation and testing datasets used for the model'
28-
license: unlicensed
42+
-
43+
name: 'Model metadata'
44+
description: 'Any model metadata including training configuration and optimizer states'
2945
-
3046
name: 'Model card'
3147
description: 'Model details including performance metrics, intended use, and limitations'
32-
license: unlicensed
3348
-
3449
name: 'Data card'
3550
description: 'Documentation for datasets including source, characteristics, and preprocessing details'
36-
license: unlicensed
3751
-
3852
name: 'Technical report'
3953
description: 'Technical report detailing capabilities and usage instructions for the model'
40-
license: unlicensed
54+
license: CC-BY-4.0
4155
-
4256
name: 'Research paper'
4357
description: 'Research paper detailing the development and capabilities of the model'
44-
license: unlicensed
58+
component_path: 'https://arxiv.org/abs/2211.05100'
59+
license: CC-BY-4.0
60+
-
61+
name: 'Evaluation results'
62+
description: 'The results from evaluating the model'

models/Granite-20B-Code-Instruct.yml

Lines changed: 12 additions & 15 deletions
Original file line numberDiff line numberDiff line change
@@ -5,49 +5,46 @@ framework:
55
release:
66
name: Granite-20B-Code-Instruct
77
version: 20B
8-
date: '2024-11-15'
9-
license: { }
8+
date: '2025-05-09'
109
type: code
1110
architecture: 'transformer decoder'
1211
origin: Granite-20B-Code-Base
1312
producer: IBM
1413
contact: ''
1514
repository: 'https://github.com/ibm-granite/granite-code-models'
16-
huggingface: 'https://huggingface.co/ibm-granite/granite-20b-code-instruct'
15+
huggingface: 'https://huggingface.co/ibm-granite/granite-20b-code-instruct-8k'
16+
license:
17+
distribution:
18+
name: Apache-2.0
19+
path: ''
1720
components:
1821
-
1922
name: 'Model architecture'
2023
description: "Well commented code for the model's architecture"
21-
license: Apache-2.0
2224
-
2325
name: 'Model parameters (Final)'
2426
description: 'Trained model parameters, weights and biases'
25-
license: Apache-2.0
2627
-
2728
name: 'Model parameters (Intermediate)'
2829
description: 'Trained model parameters, weights and biases'
29-
license: Apache-2.0
3030
-
3131
name: Datasets
3232
description: 'Training, validation and testing datasets used for the model'
33-
license: unlicensed
33+
license: MIT
3434
-
3535
name: 'Model metadata'
3636
description: 'Any model metadata including training configuration and optimizer states'
37-
license: unlicensed
3837
-
3938
name: 'Model card'
4039
description: 'Model details including performance metrics, intended use, and limitations'
41-
license: unlicensed
4240
-
4341
name: 'Data card'
4442
description: 'Documentation for datasets including source, characteristics, and preprocessing details'
45-
license: unlicensed
46-
-
47-
name: 'Technical report'
48-
description: 'Technical report detailing capabilities and usage instructions for the model'
49-
license: unlicensed
5043
-
5144
name: 'Research paper'
5245
description: 'Research paper detailing the development and capabilities of the model'
53-
license: unlicensed
46+
component_path: 'https://arxiv.org/abs/2405.04324'
47+
license: CC-BY-4.0
48+
-
49+
name: 'Evaluation results'
50+
description: 'The results from evaluating the model'

models/Granite-34B-Code-Instruct.yml

Lines changed: 13 additions & 16 deletions
Original file line numberDiff line numberDiff line change
@@ -3,51 +3,48 @@ framework:
33
version: '1.0'
44
date: '2024-12-15'
55
release:
6-
name: Granite-34B-Code-Instruct
6+
name: Granite-34B-Code-Instruct-8K
77
version: 34B
8-
date: '2024-11-15'
9-
license: { }
8+
date: '2025-05-08'
109
type: code
1110
architecture: 'transformer decoder'
1211
origin: Granite-34B-Code-Base
1312
producer: IBM
1413
contact: ''
1514
repository: 'https://github.com/ibm-granite/granite-code-models'
16-
huggingface: 'https://huggingface.co/ibm-granite/granite-34b-code-instruct'
15+
huggingface: 'https://huggingface.co/ibm-granite/granite-34b-code-instruct-8k'
16+
license:
17+
distribution:
18+
name: Apache-2.0
19+
path: ''
1720
components:
1821
-
1922
name: 'Model architecture'
2023
description: "Well commented code for the model's architecture"
21-
license: Apache-2.0
2224
-
2325
name: 'Model parameters (Final)'
2426
description: 'Trained model parameters, weights and biases'
25-
license: Apache-2.0
2627
-
2728
name: 'Model parameters (Intermediate)'
2829
description: 'Trained model parameters, weights and biases'
29-
license: Apache-2.0
3030
-
3131
name: Datasets
3232
description: 'Training, validation and testing datasets used for the model'
33-
license: unlicensed
33+
license: MIT
3434
-
3535
name: 'Model metadata'
3636
description: 'Any model metadata including training configuration and optimizer states'
37-
license: unlicensed
3837
-
3938
name: 'Model card'
4039
description: 'Model details including performance metrics, intended use, and limitations'
41-
license: unlicensed
4240
-
4341
name: 'Data card'
4442
description: 'Documentation for datasets including source, characteristics, and preprocessing details'
45-
license: unlicensed
46-
-
47-
name: 'Technical report'
48-
description: 'Technical report detailing capabilities and usage instructions for the model'
49-
license: unlicensed
5043
-
5144
name: 'Research paper'
5245
description: 'Research paper detailing the development and capabilities of the model'
53-
license: unlicensed
46+
component_path: 'https://arxiv.org/abs/2405.04324'
47+
license: CC-BY-4.0
48+
-
49+
name: 'Evaluation results'
50+
description: 'The results from evaluating the model'

models/Granite-3B-Code-Instruct.yml

Lines changed: 12 additions & 15 deletions
Original file line numberDiff line numberDiff line change
@@ -5,49 +5,46 @@ framework:
55
release:
66
name: Granite-3B-Code-Instruct
77
version: 3B
8-
date: '2024-11-15'
9-
license: { }
8+
date: '2025-05-09'
109
type: code
1110
architecture: 'transformer decoder'
1211
origin: Granite-3B-Code-Base
1312
producer: IBM
1413
contact: ''
1514
repository: 'https://github.com/ibm-granite/granite-code-models'
16-
huggingface: 'https://huggingface.co/ibm-granite/granite-3b-code-instruct'
15+
huggingface: 'https://huggingface.co/ibm-granite/granite-3b-code-instruct-2k'
16+
license:
17+
distribution:
18+
name: Apache-2.0
19+
path: ''
1720
components:
1821
-
1922
name: 'Model architecture'
2023
description: "Well commented code for the model's architecture"
21-
license: Apache-2.0
2224
-
2325
name: 'Model parameters (Final)'
2426
description: 'Trained model parameters, weights and biases'
25-
license: Apache-2.0
2627
-
2728
name: 'Model parameters (Intermediate)'
2829
description: 'Trained model parameters, weights and biases'
29-
license: Apache-2.0
3030
-
3131
name: Datasets
3232
description: 'Training, validation and testing datasets used for the model'
33-
license: unlicensed
33+
license: MIT
3434
-
3535
name: 'Model metadata'
3636
description: 'Any model metadata including training configuration and optimizer states'
37-
license: unlicensed
3837
-
3938
name: 'Model card'
4039
description: 'Model details including performance metrics, intended use, and limitations'
41-
license: unlicensed
4240
-
4341
name: 'Data card'
4442
description: 'Documentation for datasets including source, characteristics, and preprocessing details'
45-
license: unlicensed
46-
-
47-
name: 'Technical report'
48-
description: 'Technical report detailing capabilities and usage instructions for the model'
49-
license: unlicensed
5043
-
5144
name: 'Research paper'
5245
description: 'Research paper detailing the development and capabilities of the model'
53-
license: unlicensed
46+
component_path: 'https://arxiv.org/abs/2405.04324'
47+
license: CC-BY-4.0
48+
-
49+
name: 'Evaluation results'
50+
description: 'The results from evaluating the model'

models/Granite-8B-Code-Instruct.yml

Lines changed: 12 additions & 15 deletions
Original file line numberDiff line numberDiff line change
@@ -5,49 +5,46 @@ framework:
55
release:
66
name: Granite-8B-Code-Instruct
77
version: 8B
8-
date: '2024-11-15'
9-
license: { }
8+
date: '2025-05-08'
109
type: code
1110
architecture: 'transformer decoder'
1211
origin: Granite-8B-Code-Base
1312
producer: IBM
1413
contact: ''
1514
repository: 'https://github.com/ibm-granite/granite-code-models'
16-
huggingface: 'https://huggingface.co/ibm-granite/granite-8b-code-instruct'
15+
huggingface: 'https://huggingface.co/ibm-granite/granite-8b-code-instruct-4k'
16+
license:
17+
distribution:
18+
name: Apache-2.0
19+
path: ''
1720
components:
1821
-
1922
name: 'Model architecture'
2023
description: "Well commented code for the model's architecture"
21-
license: Apache-2.0
2224
-
2325
name: 'Model parameters (Final)'
2426
description: 'Trained model parameters, weights and biases'
25-
license: Apache-2.0
2627
-
2728
name: 'Model parameters (Intermediate)'
2829
description: 'Trained model parameters, weights and biases'
29-
license: Apache-2.0
3030
-
3131
name: Datasets
3232
description: 'Training, validation and testing datasets used for the model'
33-
license: unlicensed
33+
license: MIT
3434
-
3535
name: 'Model metadata'
3636
description: 'Any model metadata including training configuration and optimizer states'
37-
license: unlicensed
3837
-
3938
name: 'Model card'
4039
description: 'Model details including performance metrics, intended use, and limitations'
41-
license: unlicensed
4240
-
4341
name: 'Data card'
4442
description: 'Documentation for datasets including source, characteristics, and preprocessing details'
45-
license: unlicensed
46-
-
47-
name: 'Technical report'
48-
description: 'Technical report detailing capabilities and usage instructions for the model'
49-
license: unlicensed
5043
-
5144
name: 'Research paper'
5245
description: 'Research paper detailing the development and capabilities of the model'
53-
license: unlicensed
46+
license: CC-BY-4.0
47+
component_path: 'https://arxiv.org/abs/2405.04324'
48+
-
49+
name: 'Evaluation results'
50+
description: 'The results from evaluating the model'

models/OLMO-7B.yml

Lines changed: 15 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -5,53 +5,56 @@ framework:
55
release:
66
name: OLMO-7B
77
version: 7B
8-
date: '2024-11-15'
9-
license: { }
8+
date: '2025-05-16'
109
type: language
1110
architecture: transformer
1211
origin: oLMO
1312
producer: 'Allen Institute'
1413
contact: ''
1514
repository: 'https://github.com/allenai/OLMo'
1615
huggingface: 'https://huggingface.co/allenai/OLMo-7B'
16+
license:
17+
distribution:
18+
name: Apache-2.0
19+
path: ''
1720
components:
1821
-
1922
name: 'Model architecture'
2023
description: "Well commented code for the model's architecture"
21-
license: Apache-2.0
2224
-
2325
name: 'Data preprocessing code'
2426
description: 'Code for data cleansing, normalization, and augmentation'
25-
license: Apache-2.0
2627
-
2728
name: 'Training code'
2829
description: 'Code used for training the model'
29-
license: Apache-2.0
3030
-
3131
name: 'Inference code'
3232
description: 'Code used for running the model to make predictions'
33-
license: Apache-2.0
3433
-
3534
name: 'Evaluation code'
3635
description: 'Code used for evaluating the model'
37-
license: Apache-2.0
3836
-
3937
name: 'Model parameters (Final)'
4038
description: 'Trained model parameters, weights and biases'
41-
license: Apache-2.0
4239
-
4340
name: 'Model parameters (Intermediate)'
4441
description: 'Trained model parameters, weights and biases'
45-
license: Apache-2.0
4642
-
4743
name: Datasets
4844
description: 'Training, validation and testing datasets used for the model'
49-
license: Apache-2.0
5045
-
5146
name: 'Evaluation data'
5247
description: 'Data used for evaluating the model'
53-
license: unlicensed
48+
-
49+
name: 'Model card'
50+
description: 'Model details including performance metrics, intended use, and limitations'
51+
-
52+
name: 'Data card'
53+
description: 'Documentation for datasets including source, characteristics, and preprocessing details'
5454
-
5555
name: 'Research paper'
5656
description: 'Research paper detailing the development and capabilities of the model'
57-
license: unlicensed
57+
license: CC-BY-4.0
58+
-
59+
name: 'Evaluation results'
60+
description: 'The results from evaluating the model'

Comments (0): this commit has no comments.