Skip to content

Commit 7954269

Browse files
committed
Implemented CR Notes
1 parent 32fa84c commit 7954269

File tree

3 files changed

+117
-21
lines changed

3 files changed

+117
-21
lines changed

MLBOM/Dataset/bom.json

Lines changed: 66 additions & 15 deletions
Original file line numberDiff line numberDiff line change
@@ -19,6 +19,15 @@
1919
"publisher": "Hugging Face Inc",
2020
"name": "wikipedia",
2121
"version": "b04c8d1ceb2f5cd4588862100d08de323dccfbaa",
22+
"data": [
23+
{
24+
"type": "dataset",
25+
"name": "wikipedia",
26+
"contents": {
27+
"url": "https://huggingface.co/datasets/wikimedia/wikipedia"
28+
}
29+
}
30+
],
2231
"licenses": [
2332
{
2433
"license": {
@@ -47,21 +56,63 @@
4756
"content": "b04c8d1ceb2f5cd4588862100d08de323dccfbaa"
4857
}
4958
],
50-
"tags": [
51-
"task_categories:text-generation",
52-
"task_categories:fill-mask",
53-
"task_ids:language-modeling",
54-
"task_ids:masked-language-modeling",
55-
"language:en",
56-
"language:es",
57-
"size_categories:10M<n<100M",
58-
"format:parquet",
59-
"modality:text",
60-
"library:datasets",
61-
"library:dask",
62-
"library:mlcroissant",
63-
"library:polars",
64-
"region:us"
59+
"properties": [
60+
{
61+
"name": "task_categories",
62+
"value": "text-generation"
63+
},
64+
{
65+
"name": "task_categories",
66+
"value": "fill-mask"
67+
},
68+
{
69+
"name": "task_ids",
70+
"value": "language-modeling"
71+
},
72+
{
73+
"name": "task_ids",
74+
"value": "masked-language-modeling"
75+
},
76+
{
77+
"name": "language",
78+
"value": "en"
79+
},
80+
{
81+
"name": "language",
82+
"value": "es"
83+
},
84+
{
85+
"name": "size_categories",
86+
"value": "10M<n<100M"
87+
},
88+
{
89+
"name": "format",
90+
"value": "parquet"
91+
},
92+
{
93+
"name": "modality",
94+
"value": "text"
95+
},
96+
{
97+
"name": "library",
98+
"value": "datasets"
99+
},
100+
{
101+
"name": "library",
102+
"value": "dask"
103+
},
104+
{
105+
"name": "library",
106+
"value": "mlcroissant"
107+
},
108+
{
109+
"name": "library",
110+
"value": "polars"
111+
},
112+
{
113+
"name": "region",
114+
"value": "us"
115+
}
65116
]
66117
}
67118
]

MLBOM/Model/FoundationModels/bom.json

Lines changed: 22 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -20,7 +20,28 @@
2020
"name": "OpenAI Inc"
2121
},
2222
"publisher": "OpenAI Inc",
23-
"name": "gpt-4o"
23+
"name": "gpt-4o",
24+
"modelCard": {
25+
"modelParameters": {
26+
"modelArchitecture": "GPT-4",
27+
"inputs": [
28+
{
29+
"format": "string"
30+
},
31+
{
32+
"format": "image"
33+
}
34+
],
35+
"outputs": [
36+
{
37+
"format": "string"
38+
},
39+
{
40+
"format": "image"
41+
}
42+
]
43+
}
44+
}
2445
}
2546
]
2647
}

MLBOM/Model/OpenSource/bom.json

Lines changed: 29 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -40,6 +40,34 @@
4040
"content": "cd5ef92a9fb2f889e972770a36d4ed042daf221e"
4141
}
4242
],
43+
"modelCard": {
44+
"modelParameters": {
45+
"datasets": [
46+
{
47+
"type": "dataset",
48+
"name": "legacy-datasets/wikipedia",
49+
"contents": {
50+
"url": "https://huggingface.co/datasets/legacy-datasets/wikipedia"
51+
},
52+
"description": "Wikipedia dataset containing cleaned articles of all languages."
53+
},
54+
{
55+
"type": "dataset",
56+
"name": "bookcorpus/bookcorpus",
57+
"contents": {
58+
"url": "https://huggingface.co/datasets/bookcorpus/bookcorpus"
59+
},
60+
"description": "A corpus of text with fine-grained information and high-level semantics."
61+
}
62+
]
63+
}
64+
},
65+
"properties": [
66+
{
67+
"name": "region",
68+
"value": "us"
69+
}
70+
],
4371
"tags": [
4472
"transformers",
4573
"pytorch",
@@ -50,13 +78,9 @@
5078
"fill-mask",
5179
"exbert",
5280
"en",
53-
"dataset:bookcorpus",
54-
"dataset:wikipedia",
5581
"arxiv:1810.04805",
56-
"license:apache-2.0",
5782
"autotrain_compatible",
58-
"endpoints_compatible",
59-
"region:us"
83+
"endpoints_compatible"
6084
]
6185
}
6286
]

0 commit comments

Comments
 (0)