Skip to content

Commit e49932d

Browse files
authored
Merge pull request #178 from lehors/pythia-update
Update Pythia models
2 parents 5279ab6 + d51db10 commit e49932d

18 files changed

+604
-236
lines changed

models/Pythia-1.4B.yml

Lines changed: 75 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,75 @@
1+
framework:
2+
name: 'Model Openness Framework'
3+
version: '1.0'
4+
date: '2024-12-15'
5+
release:
6+
name: Pythia-1.4B
7+
version: 1.4B
8+
date: '2025-11-03'
9+
type: language
10+
architecture: transformer
11+
origin: ''
12+
producer: EleutherAI
13+
contact: ''
14+
repository: 'https://github.com/EleutherAI/pythia'
15+
huggingface: 'https://huggingface.co/EleutherAI/pythia-1.4b'
16+
license:
17+
distribution:
18+
name: Apache-2.0
19+
path: ''
20+
components:
21+
-
22+
name: 'Model architecture'
23+
description: "Well commented code for the model's architecture"
24+
-
25+
name: 'Data preprocessing code'
26+
description: 'Code for data cleansing, normalization, and augmentation'
27+
component_path: 'https://github.com/EleutherAI/the-pile'
28+
license: MIT
29+
license_path: 'https://github.com/EleutherAI/the-pile/blob/master/LICENSE'
30+
-
31+
name: 'Training code'
32+
description: 'Code used for training the model'
33+
license: MIT
34+
-
35+
name: 'Inference code'
36+
description: 'Code used for running the model to make predictions'
37+
-
38+
name: 'Evaluation code'
39+
description: 'Code used for evaluating the model'
40+
component_path: 'https://github.com/EleutherAI/lm-evaluation-harness'
41+
license: MIT
42+
license_path: 'https://github.com/EleutherAI/lm-evaluation-harness/blob/main/LICENSE.md'
43+
-
44+
name: 'Supporting libraries and tools'
45+
description: "Libraries and tools used in the model's development"
46+
-
47+
name: 'Model parameters (Final)'
48+
description: 'Trained model parameters, weights and biases'
49+
-
50+
name: 'Model parameters (Intermediate)'
51+
description: 'Trained model parameters, weights and biases'
52+
-
53+
name: Datasets
54+
description: 'Training, validation and testing datasets used for the model'
55+
component_path: 'https://pile.eleuther.ai/'
56+
-
57+
name: 'Evaluation data'
58+
description: 'Data used for evaluating the model'
59+
-
60+
name: 'Model metadata'
61+
description: 'Any model metadata including training configuration and optimizer states'
62+
-
63+
name: 'Model card'
64+
description: 'Model details including performance metrics, intended use, and limitations'
65+
-
66+
name: 'Data card'
67+
description: 'Documentation for datasets including source, characteristics, and preprocessing details'
68+
-
69+
name: 'Research paper'
70+
description: 'Research paper detailing the development and capabilities of the model'
71+
component_path: 'https://arxiv.org/abs/2304.01373'
72+
license: CC-BY-SA-4.0
73+
-
74+
name: 'Evaluation results'
75+
description: 'The results from evaluating the model'

models/Pythia-12B.yml

Lines changed: 75 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,75 @@
1+
framework:
2+
name: 'Model Openness Framework'
3+
version: '1.0'
4+
date: '2024-12-15'
5+
release:
6+
name: Pythia-12B
7+
version: 12B
8+
date: '2025-11-03'
9+
type: language
10+
architecture: transformer
11+
origin: ''
12+
producer: EleutherAI
13+
contact: ''
14+
repository: 'https://github.com/EleutherAI/pythia'
15+
huggingface: 'https://huggingface.co/EleutherAI/pythia-12b'
16+
license:
17+
distribution:
18+
name: Apache-2.0
19+
path: ''
20+
components:
21+
-
22+
name: 'Model architecture'
23+
description: "Well commented code for the model's architecture"
24+
-
25+
name: 'Data preprocessing code'
26+
description: 'Code for data cleansing, normalization, and augmentation'
27+
component_path: 'https://github.com/EleutherAI/the-pile'
28+
license: MIT
29+
license_path: 'https://github.com/EleutherAI/the-pile/blob/master/LICENSE'
30+
-
31+
name: 'Training code'
32+
description: 'Code used for training the model'
33+
license: MIT
34+
-
35+
name: 'Inference code'
36+
description: 'Code used for running the model to make predictions'
37+
-
38+
name: 'Evaluation code'
39+
description: 'Code used for evaluating the model'
40+
component_path: 'https://github.com/EleutherAI/lm-evaluation-harness'
41+
license: MIT
42+
license_path: 'https://github.com/EleutherAI/lm-evaluation-harness/blob/main/LICENSE.md'
43+
-
44+
name: 'Supporting libraries and tools'
45+
description: "Libraries and tools used in the model's development"
46+
-
47+
name: 'Model parameters (Final)'
48+
description: 'Trained model parameters, weights and biases'
49+
-
50+
name: 'Model parameters (Intermediate)'
51+
description: 'Trained model parameters, weights and biases'
52+
-
53+
name: Datasets
54+
description: 'Training, validation and testing datasets used for the model'
55+
component_path: 'https://pile.eleuther.ai/'
56+
-
57+
name: 'Evaluation data'
58+
description: 'Data used for evaluating the model'
59+
-
60+
name: 'Model metadata'
61+
description: 'Any model metadata including training configuration and optimizer states'
62+
-
63+
name: 'Model card'
64+
description: 'Model details including performance metrics, intended use, and limitations'
65+
-
66+
name: 'Data card'
67+
description: 'Documentation for datasets including source, characteristics, and preprocessing details'
68+
-
69+
name: 'Research paper'
70+
description: 'Research paper detailing the development and capabilities of the model'
71+
component_path: 'https://arxiv.org/abs/2304.01373'
72+
license: CC-BY-SA-4.0
73+
-
74+
name: 'Evaluation results'
75+
description: 'The results from evaluating the model'

models/pythia-14M.yml renamed to models/Pythia-14M.yml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -3,7 +3,7 @@ framework:
33
version: '1.0'
44
date: '2024-12-15'
55
release:
6-
name: pythia-14M
6+
name: Pythia-14M
77
version: 14M
88
date: '2025-05-22'
99
type: language
@@ -12,7 +12,7 @@ release:
1212
producer: EleutherAI
1313
contact: ''
1414
repository: ''
15-
huggingface: EleutherAI/pythia-14m
15+
huggingface: 'https://huggingface.co/EleutherAI/pythia-14m'
1616
license: { }
1717
components:
1818
-

models/Pythia-160M.yml

Lines changed: 75 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,75 @@
1+
framework:
2+
name: 'Model Openness Framework'
3+
version: '1.0'
4+
date: '2024-12-15'
5+
release:
6+
name: Pythia-160M
7+
version: 160M
8+
date: '2025-11-03'
9+
type: language
10+
architecture: transformer
11+
origin: ''
12+
producer: EleutherAI
13+
contact: ''
14+
repository: 'https://github.com/EleutherAI/pythia'
15+
huggingface: 'https://huggingface.co/EleutherAI/pythia-160m'
16+
license:
17+
distribution:
18+
name: Apache-2.0
19+
path: ''
20+
components:
21+
-
22+
name: 'Model architecture'
23+
description: "Well commented code for the model's architecture"
24+
-
25+
name: 'Data preprocessing code'
26+
description: 'Code for data cleansing, normalization, and augmentation'
27+
component_path: 'https://github.com/EleutherAI/the-pile'
28+
license: MIT
29+
license_path: 'https://github.com/EleutherAI/the-pile/blob/master/LICENSE'
30+
-
31+
name: 'Training code'
32+
description: 'Code used for training the model'
33+
license: MIT
34+
-
35+
name: 'Inference code'
36+
description: 'Code used for running the model to make predictions'
37+
-
38+
name: 'Evaluation code'
39+
description: 'Code used for evaluating the model'
40+
component_path: 'https://github.com/EleutherAI/lm-evaluation-harness'
41+
license: MIT
42+
license_path: 'https://github.com/EleutherAI/lm-evaluation-harness/blob/main/LICENSE.md'
43+
-
44+
name: 'Supporting libraries and tools'
45+
description: "Libraries and tools used in the model's development"
46+
-
47+
name: 'Model parameters (Final)'
48+
description: 'Trained model parameters, weights and biases'
49+
-
50+
name: 'Model parameters (Intermediate)'
51+
description: 'Trained model parameters, weights and biases'
52+
-
53+
name: Datasets
54+
description: 'Training, validation and testing datasets used for the model'
55+
component_path: 'https://pile.eleuther.ai/'
56+
-
57+
name: 'Evaluation data'
58+
description: 'Data used for evaluating the model'
59+
-
60+
name: 'Model metadata'
61+
description: 'Any model metadata including training configuration and optimizer states'
62+
-
63+
name: 'Model card'
64+
description: 'Model details including performance metrics, intended use, and limitations'
65+
-
66+
name: 'Data card'
67+
description: 'Documentation for datasets including source, characteristics, and preprocessing details'
68+
-
69+
name: 'Research paper'
70+
description: 'Research paper detailing the development and capabilities of the model'
71+
component_path: 'https://arxiv.org/abs/2304.01373'
72+
license: CC-BY-SA-4.0
73+
-
74+
name: 'Evaluation results'
75+
description: 'The results from evaluating the model'

models/Pythia-1B.yml

Lines changed: 75 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,75 @@
1+
framework:
2+
name: 'Model Openness Framework'
3+
version: '1.0'
4+
date: '2024-12-15'
5+
release:
6+
name: Pythia-1B
7+
version: 1B
8+
date: '2025-11-03'
9+
type: language
10+
architecture: transformer
11+
origin: ''
12+
producer: EleutherAI
13+
contact: ''
14+
repository: 'https://github.com/EleutherAI/pythia'
15+
huggingface: 'https://huggingface.co/EleutherAI/pythia-1b'
16+
license:
17+
distribution:
18+
name: Apache-2.0
19+
path: ''
20+
components:
21+
-
22+
name: 'Model architecture'
23+
description: "Well commented code for the model's architecture"
24+
-
25+
name: 'Data preprocessing code'
26+
description: 'Code for data cleansing, normalization, and augmentation'
27+
component_path: 'https://github.com/EleutherAI/the-pile'
28+
license: MIT
29+
license_path: 'https://github.com/EleutherAI/the-pile/blob/master/LICENSE'
30+
-
31+
name: 'Training code'
32+
description: 'Code used for training the model'
33+
license: MIT
34+
-
35+
name: 'Inference code'
36+
description: 'Code used for running the model to make predictions'
37+
-
38+
name: 'Evaluation code'
39+
description: 'Code used for evaluating the model'
40+
component_path: 'https://github.com/EleutherAI/lm-evaluation-harness'
41+
license: MIT
42+
license_path: 'https://github.com/EleutherAI/lm-evaluation-harness/blob/main/LICENSE.md'
43+
-
44+
name: 'Supporting libraries and tools'
45+
description: "Libraries and tools used in the model's development"
46+
-
47+
name: 'Model parameters (Final)'
48+
description: 'Trained model parameters, weights and biases'
49+
-
50+
name: 'Model parameters (Intermediate)'
51+
description: 'Trained model parameters, weights and biases'
52+
-
53+
name: Datasets
54+
description: 'Training, validation and testing datasets used for the model'
55+
component_path: 'https://pile.eleuther.ai/'
56+
-
57+
name: 'Evaluation data'
58+
description: 'Data used for evaluating the model'
59+
-
60+
name: 'Model metadata'
61+
description: 'Any model metadata including training configuration and optimizer states'
62+
-
63+
name: 'Model card'
64+
description: 'Model details including performance metrics, intended use, and limitations'
65+
-
66+
name: 'Data card'
67+
description: 'Documentation for datasets including source, characteristics, and preprocessing details'
68+
-
69+
name: 'Research paper'
70+
description: 'Research paper detailing the development and capabilities of the model'
71+
component_path: 'https://arxiv.org/abs/2304.01373'
72+
license: CC-BY-SA-4.0
73+
-
74+
name: 'Evaluation results'
75+
description: 'The results from evaluating the model'

models/Pythia-2.8B.yml

Lines changed: 75 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,75 @@
1+
framework:
2+
name: 'Model Openness Framework'
3+
version: '1.0'
4+
date: '2024-12-15'
5+
release:
6+
name: Pythia-2.8B
7+
version: 2.8B
8+
date: '2025-11-03'
9+
type: language
10+
architecture: transformer
11+
origin: ''
12+
producer: EleutherAI
13+
contact: ''
14+
repository: 'https://github.com/EleutherAI/pythia'
15+
huggingface: 'https://huggingface.co/EleutherAI/pythia-2.8b'
16+
license:
17+
distribution:
18+
name: Apache-2.0
19+
path: ''
20+
components:
21+
-
22+
name: 'Model architecture'
23+
description: "Well commented code for the model's architecture"
24+
-
25+
name: 'Data preprocessing code'
26+
description: 'Code for data cleansing, normalization, and augmentation'
27+
component_path: 'https://github.com/EleutherAI/the-pile'
28+
license: MIT
29+
license_path: 'https://github.com/EleutherAI/the-pile/blob/master/LICENSE'
30+
-
31+
name: 'Training code'
32+
description: 'Code used for training the model'
33+
license: MIT
34+
-
35+
name: 'Inference code'
36+
description: 'Code used for running the model to make predictions'
37+
-
38+
name: 'Evaluation code'
39+
description: 'Code used for evaluating the model'
40+
component_path: 'https://github.com/EleutherAI/lm-evaluation-harness'
41+
license: MIT
42+
license_path: 'https://github.com/EleutherAI/lm-evaluation-harness/blob/main/LICENSE.md'
43+
-
44+
name: 'Supporting libraries and tools'
45+
description: "Libraries and tools used in the model's development"
46+
-
47+
name: 'Model parameters (Final)'
48+
description: 'Trained model parameters, weights and biases'
49+
-
50+
name: 'Model parameters (Intermediate)'
51+
description: 'Trained model parameters, weights and biases'
52+
-
53+
name: Datasets
54+
description: 'Training, validation and testing datasets used for the model'
55+
component_path: 'https://pile.eleuther.ai/'
56+
-
57+
name: 'Evaluation data'
58+
description: 'Data used for evaluating the model'
59+
-
60+
name: 'Model metadata'
61+
description: 'Any model metadata including training configuration and optimizer states'
62+
-
63+
name: 'Model card'
64+
description: 'Model details including performance metrics, intended use, and limitations'
65+
-
66+
name: 'Data card'
67+
description: 'Documentation for datasets including source, characteristics, and preprocessing details'
68+
-
69+
name: 'Research paper'
70+
description: 'Research paper detailing the development and capabilities of the model'
71+
component_path: 'https://arxiv.org/abs/2304.01373'
72+
license: CC-BY-SA-4.0
73+
-
74+
name: 'Evaluation results'
75+
description: 'The results from evaluating the model'

0 commit comments

Comments
 (0)