Skip to content

Commit

Permalink
added ml bom
Browse files Browse the repository at this point in the history
  • Loading branch information
galmo-noma committed Nov 25, 2024
1 parent d78f472 commit 177f679
Show file tree
Hide file tree
Showing 4 changed files with 505 additions and 0 deletions.
388 changes: 388 additions & 0 deletions MLBOM/Dataset/bom.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,388 @@
{
"$schema": "http://cyclonedx.org/schema/bom-1.6.schema.json",
"bomFormat": "CycloneDX",
"specVersion": "1.6",
"serialNumber": "urn:uuid:75de3b9b-9e53-4421-a259-11f18afc22bf",
"version": 1,
"metadata": {
"timestamp": "2024-11-24T13:10:49Z"
},
"components": [
{
"type": "data",
"supplier": {
"name": "Wikimedia"
},
"manufacturer": {
"name": "Wikimedia"
},
"publisher": "Hugging Face Inc",
"name": "wikipedia",
"version": "b04c8d1ceb2f5cd4588862100d08de323dccfbaa",
"licenses": [
{
"license": {
"id": "CC-BY-SA-3.0",
"name": "Creative Commons Attribution Share Alike 3.0 Unported",
"url": "https://spdx.org/licenses/CC-BY-SA-3.0.html"
}
},
{
"license": {
"id": "GFDL-1.3",
"name": "GNU Free Documentation License v1.3",
"url": "https://www.gnu.org/licenses/fdl-1.3.en.html"
}
}
],
"externalReferences": [
{
"type": "website",
"url": "https://huggingface.co/datasets/wikimedia/wikipedia"
}
],
"hashes": [
{
"alg": "SHA-1",
"content": "b04c8d1ceb2f5cd4588862100d08de323dccfbaa"
}
],
"tags": [
"task_categories:text-generation",
"task_categories:fill-mask",
"task_ids:language-modeling",
"task_ids:masked-language-modeling",
"language:ab",
"language:ace",
"language:ady",
"language:af",
"language:alt",
"language:am",
"language:ami",
"language:an",
"language:ang",
"language:anp",
"language:ar",
"language:arc",
"language:ary",
"language:arz",
"language:as",
"language:ast",
"language:atj",
"language:av",
"language:avk",
"language:awa",
"language:ay",
"language:az",
"language:azb",
"language:ba",
"language:ban",
"language:bar",
"language:bbc",
"language:bcl",
"language:be",
"language:bg",
"language:bh",
"language:bi",
"language:bjn",
"language:blk",
"language:bm",
"language:bn",
"language:bo",
"language:bpy",
"language:br",
"language:bs",
"language:bug",
"language:bxr",
"language:ca",
"language:cbk",
"language:cdo",
"language:ce",
"language:ceb",
"language:ch",
"language:chr",
"language:chy",
"language:ckb",
"language:co",
"language:cr",
"language:crh",
"language:cs",
"language:csb",
"language:cu",
"language:cv",
"language:cy",
"language:da",
"language:dag",
"language:de",
"language:dga",
"language:din",
"language:diq",
"language:dsb",
"language:dty",
"language:dv",
"language:dz",
"language:ee",
"language:el",
"language:eml",
"language:en",
"language:eo",
"language:es",
"language:et",
"language:eu",
"language:ext",
"language:fa",
"language:fat",
"language:ff",
"language:fi",
"language:fj",
"language:fo",
"language:fon",
"language:fr",
"language:frp",
"language:frr",
"language:fur",
"language:fy",
"language:ga",
"language:gag",
"language:gan",
"language:gcr",
"language:gd",
"language:gl",
"language:glk",
"language:gn",
"language:gom",
"language:gor",
"language:got",
"language:gpe",
"language:gsw",
"language:gu",
"language:guc",
"language:gur",
"language:guw",
"language:gv",
"language:ha",
"language:hak",
"language:haw",
"language:hbs",
"language:he",
"language:hi",
"language:hif",
"language:hr",
"language:hsb",
"language:ht",
"language:hu",
"language:hy",
"language:hyw",
"language:ia",
"language:id",
"language:ie",
"language:ig",
"language:ik",
"language:ilo",
"language:inh",
"language:io",
"language:is",
"language:it",
"language:iu",
"language:ja",
"language:jam",
"language:jbo",
"language:jv",
"language:ka",
"language:kaa",
"language:kab",
"language:kbd",
"language:kbp",
"language:kcg",
"language:kg",
"language:ki",
"language:kk",
"language:kl",
"language:km",
"language:kn",
"language:ko",
"language:koi",
"language:krc",
"language:ks",
"language:ksh",
"language:ku",
"language:kv",
"language:kw",
"language:ky",
"language:la",
"language:lad",
"language:lb",
"language:lbe",
"language:lez",
"language:lfn",
"language:lg",
"language:li",
"language:lij",
"language:lld",
"language:lmo",
"language:ln",
"language:lo",
"language:lt",
"language:ltg",
"language:lv",
"language:lzh",
"language:mad",
"language:mai",
"language:map",
"language:mdf",
"language:mg",
"language:mhr",
"language:mi",
"language:min",
"language:mk",
"language:ml",
"language:mn",
"language:mni",
"language:mnw",
"language:mr",
"language:mrj",
"language:ms",
"language:mt",
"language:mwl",
"language:my",
"language:myv",
"language:mzn",
"language:nah",
"language:nan",
"language:nap",
"language:nds",
"language:ne",
"language:new",
"language:nia",
"language:nl",
"language:nn",
"language:no",
"language:nov",
"language:nqo",
"language:nrf",
"language:nso",
"language:nv",
"language:ny",
"language:oc",
"language:olo",
"language:om",
"language:or",
"language:os",
"language:pa",
"language:pag",
"language:pam",
"language:pap",
"language:pcd",
"language:pcm",
"language:pdc",
"language:pfl",
"language:pi",
"language:pih",
"language:pl",
"language:pms",
"language:pnb",
"language:pnt",
"language:ps",
"language:pt",
"language:pwn",
"language:qu",
"language:rm",
"language:rmy",
"language:rn",
"language:ro",
"language:ru",
"language:rue",
"language:rup",
"language:rw",
"language:sa",
"language:sah",
"language:sat",
"language:sc",
"language:scn",
"language:sco",
"language:sd",
"language:se",
"language:sg",
"language:sgs",
"language:shi",
"language:shn",
"language:si",
"language:sk",
"language:skr",
"language:sl",
"language:sm",
"language:smn",
"language:sn",
"language:so",
"language:sq",
"language:sr",
"language:srn",
"language:ss",
"language:st",
"language:stq",
"language:su",
"language:sv",
"language:sw",
"language:szl",
"language:szy",
"language:ta",
"language:tay",
"language:tcy",
"language:te",
"language:tet",
"language:tg",
"language:th",
"language:ti",
"language:tk",
"language:tl",
"language:tly",
"language:tn",
"language:to",
"language:tpi",
"language:tr",
"language:trv",
"language:ts",
"language:tt",
"language:tum",
"language:tw",
"language:ty",
"language:tyv",
"language:udm",
"language:ug",
"language:uk",
"language:ur",
"language:uz",
"language:ve",
"language:vec",
"language:vep",
"language:vi",
"language:vls",
"language:vo",
"language:vro",
"language:wa",
"language:war",
"language:wo",
"language:wuu",
"language:xal",
"language:xh",
"language:xmf",
"language:yi",
"language:yo",
"language:yue",
"language:za",
"language:zea",
"language:zgh",
"language:zh",
"language:zu",
"size_categories:10M<n<100M",
"format:parquet",
"modality:text",
"library:datasets",
"library:dask",
"library:mlcroissant",
"library:polars",
"region:us"
]
}
]
}
Loading

0 comments on commit 177f679

Please sign in to comment.