add AIBOM
#83
by
RiccardoDav
- opened
- HuggingFaceM4_idefics2-8b.json +1163 -0
HuggingFaceM4_idefics2-8b.json
ADDED
@@ -0,0 +1,1163 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bomFormat": "CycloneDX",
|
3 |
+
"specVersion": "1.6",
|
4 |
+
"serialNumber": "urn:uuid:f23c2a8d-7038-4272-957e-ca97df335610",
|
5 |
+
"version": 1,
|
6 |
+
"metadata": {
|
7 |
+
"timestamp": "2025-06-05T09:38:20.021414+00:00",
|
8 |
+
"component": {
|
9 |
+
"type": "machine-learning-model",
|
10 |
+
"bom-ref": "HuggingFaceM4/idefics2-8b-7bb21b56-dde0-500e-bf25-f4c32e64aa26",
|
11 |
+
"name": "HuggingFaceM4/idefics2-8b",
|
12 |
+
"externalReferences": [
|
13 |
+
{
|
14 |
+
"url": "https://huggingface.co/HuggingFaceM4/idefics2-8b",
|
15 |
+
"type": "documentation"
|
16 |
+
}
|
17 |
+
],
|
18 |
+
"modelCard": {
|
19 |
+
"modelParameters": {
|
20 |
+
"task": "image-text-to-text",
|
21 |
+
"architectureFamily": "idefics2",
|
22 |
+
"modelArchitecture": "Idefics2ForConditionalGeneration",
|
23 |
+
"datasets": [
|
24 |
+
{
|
25 |
+
"ref": "HuggingFaceM4/OBELICS-54e0c87c-8ce6-51eb-af0d-52a7ddb63e49"
|
26 |
+
},
|
27 |
+
{
|
28 |
+
"ref": "laion/laion-coco-6e73f888-3348-5039-864c-d2250f312f2e"
|
29 |
+
},
|
30 |
+
{
|
31 |
+
"ref": "wikipedia-8c5eb686-d691-517b-aad7-040fa51febc3"
|
32 |
+
},
|
33 |
+
{
|
34 |
+
"ref": "facebook/pmd-71fff1f1-79e2-5837-818a-a847941edaff"
|
35 |
+
},
|
36 |
+
{
|
37 |
+
"ref": "pixparse/idl-wds-5ddb0bef-9a41-5fb6-acce-2d16b0053443"
|
38 |
+
},
|
39 |
+
{
|
40 |
+
"ref": "pixparse/pdfa-eng-wds-6e24c86a-28c2-50e7-80c1-b74796cd7222"
|
41 |
+
},
|
42 |
+
{
|
43 |
+
"ref": "wendlerc/RenderedText-2ea0375f-e9a2-55d0-aa1e-734edec2644e"
|
44 |
+
},
|
45 |
+
{
|
46 |
+
"ref": "HuggingFaceM4/the_cauldron-0b60b937-29a7-5f0c-9fa6-ec10bf894687"
|
47 |
+
},
|
48 |
+
{
|
49 |
+
"ref": "teknium/OpenHermes-2.5-1a7eb3be-7eaa-5577-91f6-d4ad0d639c6c"
|
50 |
+
},
|
51 |
+
{
|
52 |
+
"ref": "GAIR/lima-afa8f631-d0ed-59c0-a5a1-170c80a5117e"
|
53 |
+
},
|
54 |
+
{
|
55 |
+
"ref": "databricks/databricks-dolly-15k-1008cfb1-7624-5c5b-93cc-d856239b86ea"
|
56 |
+
},
|
57 |
+
{
|
58 |
+
"ref": "meta-math/MetaMathQA-c6cf810a-8b06-5552-a876-53681c5fe9a1"
|
59 |
+
},
|
60 |
+
{
|
61 |
+
"ref": "TIGER-Lab/MathInstruct-9d9c997d-f6c1-5029-96fd-6003c4f0ec06"
|
62 |
+
},
|
63 |
+
{
|
64 |
+
"ref": "microsoft/orca-math-word-problems-200k-611afa9f-b6db-5b9f-9a51-598e4ce79d0e"
|
65 |
+
},
|
66 |
+
{
|
67 |
+
"ref": "camel-ai/math-9f7ffeb0-2fb3-5b72-9ca4-1b461f022e61"
|
68 |
+
},
|
69 |
+
{
|
70 |
+
"ref": "AtlasUnified/atlas-math-sets-49141027-0c69-515d-8182-254cf889efae"
|
71 |
+
},
|
72 |
+
{
|
73 |
+
"ref": "tiedong/goat-38642401-79d7-541d-a92f-d3d7acdb8db8"
|
74 |
+
},
|
75 |
+
{
|
76 |
+
"ref": "Lin-Chen/ShareGPT4V-f6982603-3c10-5cd0-9d2d-83d573b61341"
|
77 |
+
},
|
78 |
+
{
|
79 |
+
"ref": "jxu124/llava_conversation_58k-7dcd95f0-d26a-5075-89f4-4afc13a5b93f"
|
80 |
+
}
|
81 |
+
]
|
82 |
+
},
|
83 |
+
"properties": [
|
84 |
+
{
|
85 |
+
"name": "library_name",
|
86 |
+
"value": "transformers"
|
87 |
+
}
|
88 |
+
],
|
89 |
+
"consideration": {
|
90 |
+
"useCases": "`idefics2-8b-base` and `idefics2-8b` can be used to perform inference on multimodal (image + text) tasks in which the input is composed of a text query along with one (or multiple) image(s). Text and images can be arbitrarily interleaved. That includes image captioning, visual question answering, etc. These model does not support image generation.For optimal results, we recommend fine-tuning `idefics2-8b` on one's specific use-case and data. In fact, the instruction-fine-tuned model (`idefics2-8b`) is significantly better at following instructions from users and thus should be preferred when using the models out-of-the-box or as a starting point for fine-tuning.`idefics2-8b` usually generates very short answers. For long generations, use `idefics2-8b-chatty`, which was further fine-tuned on long conversations.As a starting point, we provide fine-tuning codes that can be adapted for one's particular scenario:- With the [TRL library](https://github.com/huggingface/trl): [Script](https://gist.github.com/edbeeching/228652fc6c2b29a1641be5a5778223cb)- With the [Hugging Face Trainer](https://huggingface.co/docs/transformers/main/en/main_classes/trainer#api-reference%20][%20transformers.Trainer): [Tutorial notebook](https://colab.research.google.com/drive/1NtcTgRbSBKN7pYD3Vdx1j9m8pt3fhFDB?usp=sharing)"
|
91 |
+
}
|
92 |
+
},
|
93 |
+
"authors": [
|
94 |
+
{
|
95 |
+
"name": "HuggingFaceM4"
|
96 |
+
}
|
97 |
+
],
|
98 |
+
"licenses": [
|
99 |
+
{
|
100 |
+
"license": {
|
101 |
+
"id": "Apache-2.0",
|
102 |
+
"url": "https://spdx.org/licenses/Apache-2.0.html"
|
103 |
+
}
|
104 |
+
}
|
105 |
+
],
|
106 |
+
"description": "- **Developed by:** Hugging Face- **Model type:** Multi-modal model (image+text)- **Language(s) (NLP):** en- **License:** Apache 2.0- **Parent Models:** [google/siglip-so400m-patch14-384](https://huggingface.co/google/siglip-so400m-patch14-384) and [mistralai/Mistral-7B-v0.1](https://huggingface.co/mistralai/Mistral-7B-v0.1)- **Resources for more information:**- Description of [OBELICS](https://huggingface.co/datasets/HuggingFaceM4/OBELICS): [OBELICS: An Open Web-Scale Filtered Dataset of Interleaved Image-Text Documents](https://huggingface.co/papers/2306.16527)- Paper: [What matters when building vision-language models?](https://huggingface.co/papers/2405.02246)",
|
107 |
+
"tags": [
|
108 |
+
"transformers",
|
109 |
+
"safetensors",
|
110 |
+
"idefics2",
|
111 |
+
"image-text-to-text",
|
112 |
+
"multimodal",
|
113 |
+
"vision",
|
114 |
+
"en",
|
115 |
+
"dataset:HuggingFaceM4/OBELICS",
|
116 |
+
"dataset:laion/laion-coco",
|
117 |
+
"dataset:wikipedia",
|
118 |
+
"dataset:facebook/pmd",
|
119 |
+
"dataset:pixparse/idl-wds",
|
120 |
+
"dataset:pixparse/pdfa-eng-wds",
|
121 |
+
"dataset:wendlerc/RenderedText",
|
122 |
+
"dataset:HuggingFaceM4/the_cauldron",
|
123 |
+
"dataset:teknium/OpenHermes-2.5",
|
124 |
+
"dataset:GAIR/lima",
|
125 |
+
"dataset:databricks/databricks-dolly-15k",
|
126 |
+
"dataset:meta-math/MetaMathQA",
|
127 |
+
"dataset:TIGER-Lab/MathInstruct",
|
128 |
+
"dataset:microsoft/orca-math-word-problems-200k",
|
129 |
+
"dataset:camel-ai/math",
|
130 |
+
"dataset:AtlasUnified/atlas-math-sets",
|
131 |
+
"dataset:tiedong/goat",
|
132 |
+
"dataset:Lin-Chen/ShareGPT4V",
|
133 |
+
"dataset:jxu124/llava_conversation_58k",
|
134 |
+
"arxiv:2306.16527",
|
135 |
+
"arxiv:2405.02246",
|
136 |
+
"arxiv:2307.06304",
|
137 |
+
"arxiv:2311.07575",
|
138 |
+
"arxiv:2103.03206",
|
139 |
+
"license:apache-2.0",
|
140 |
+
"text-generation-inference",
|
141 |
+
"endpoints_compatible",
|
142 |
+
"region:us"
|
143 |
+
]
|
144 |
+
}
|
145 |
+
},
|
146 |
+
"components": [
|
147 |
+
{
|
148 |
+
"type": "data",
|
149 |
+
"bom-ref": "HuggingFaceM4/OBELICS-54e0c87c-8ce6-51eb-af0d-52a7ddb63e49",
|
150 |
+
"name": "HuggingFaceM4/OBELICS",
|
151 |
+
"data": [
|
152 |
+
{
|
153 |
+
"type": "dataset",
|
154 |
+
"bom-ref": "HuggingFaceM4/OBELICS-54e0c87c-8ce6-51eb-af0d-52a7ddb63e49",
|
155 |
+
"name": "HuggingFaceM4/OBELICS",
|
156 |
+
"contents": {
|
157 |
+
"url": "https://huggingface.co/datasets/HuggingFaceM4/OBELICS",
|
158 |
+
"properties": [
|
159 |
+
{
|
160 |
+
"name": "language",
|
161 |
+
"value": "en"
|
162 |
+
},
|
163 |
+
{
|
164 |
+
"name": "size_categories",
|
165 |
+
"value": "100M<n<1B"
|
166 |
+
},
|
167 |
+
{
|
168 |
+
"name": "pretty_name",
|
169 |
+
"value": "OBELICS"
|
170 |
+
},
|
171 |
+
{
|
172 |
+
"name": "configs",
|
173 |
+
"value": "Name of the dataset subset: default {\"split\": \"train\", \"path\": \"data/train-*\"}"
|
174 |
+
},
|
175 |
+
{
|
176 |
+
"name": "configs",
|
177 |
+
"value": "Name of the dataset subset: opt_out_docs_removed_2023_07_12 {\"split\": \"train\", \"path\": \"opt_out_docs_removed_2023_07_12/train-*\"}"
|
178 |
+
},
|
179 |
+
{
|
180 |
+
"name": "license",
|
181 |
+
"value": "cc-by-4.0"
|
182 |
+
}
|
183 |
+
]
|
184 |
+
},
|
185 |
+
"governance": {
|
186 |
+
"owners": [
|
187 |
+
{
|
188 |
+
"organization": {
|
189 |
+
"name": "HuggingFaceM4",
|
190 |
+
"url": "https://huggingface.co/HuggingFaceM4"
|
191 |
+
}
|
192 |
+
}
|
193 |
+
]
|
194 |
+
},
|
195 |
+
"description": "\n\t\n\t\t\n\t\tDataset Card for OBELICS\n\t\n\nOBELICS is an open, massive, and curated collection of interleaved image-text web documents, containing 141M English documents, 115B text tokens, and 353M images, extracted from Common Crawl dumps between February 2020 and February 2023. The collection and filtering steps are described in our paper.\nInterleaved image-text web documents are a succession of text paragraphs interleaved by images, such as web pages that contain images. Models trained on these\u2026 See the full description on the dataset page: https://huggingface.co/datasets/HuggingFaceM4/OBELICS."
|
196 |
+
}
|
197 |
+
]
|
198 |
+
},
|
199 |
+
{
  "type": "data",
  "bom-ref": "laion/laion-coco-6e73f888-3348-5039-864c-d2250f312f2e",
  "name": "laion/laion-coco"
},
|
200 |
+
{
|
201 |
+
"type": "data",
|
202 |
+
"bom-ref": "wikipedia-8c5eb686-d691-517b-aad7-040fa51febc3",
|
203 |
+
"name": "wikipedia",
|
204 |
+
"data": [
|
205 |
+
{
|
206 |
+
"type": "dataset",
|
207 |
+
"bom-ref": "wikipedia-8c5eb686-d691-517b-aad7-040fa51febc3",
|
208 |
+
"name": "wikipedia",
|
209 |
+
"contents": {
|
210 |
+
"url": "https://huggingface.co/datasets/wikipedia",
|
211 |
+
"properties": [
|
212 |
+
{
|
213 |
+
"name": "task_categories",
|
214 |
+
"value": "text-generation, fill-mask"
|
215 |
+
},
|
216 |
+
{
|
217 |
+
"name": "task_ids",
|
218 |
+
"value": "language-modeling, masked-language-modeling"
|
219 |
+
},
|
220 |
+
{
|
221 |
+
"name": "language",
|
222 |
+
"value": "aa, ab, ace, af, ak, als, am, an, ang, ar, arc, arz, as, ast, atj, av, ay, az, azb, ba, bar, bcl, be, bg, bh, bi, bjn, bm, bn, bo, bpy, br, bs, bug, bxr, ca, cbk, cdo, ce, ceb, ch, cho, chr, chy, ckb, co, cr, crh, cs, csb, cu, cv, cy, da, de, din, diq, dsb, dty, dv, dz, ee, el, eml, en, eo, es, et, eu, ext, fa, ff, fi, fj, fo, fr, frp, frr, fur, fy, ga, gag, gan, gd, gl, glk, gn, gom, gor, got, gu, gv, ha, hak, haw, he, hi, hif, ho, hr, hsb, ht, hu, hy, ia, id, ie, ig, ii, ik, ilo, inh, io, is, it, iu, ja, jam, jbo, jv, ka, kaa, kab, kbd, kbp, kg, ki, kj, kk, kl, km, kn, ko, koi, krc, ks, ksh, ku, kv, kw, ky, la, lad, lb, lbe, lez, lfn, lg, li, lij, lmo, ln, lo, lrc, lt, ltg, lv, lzh, mai, mdf, mg, mh, mhr, mi, min, mk, ml, mn, mr, mrj, ms, mt, mus, mwl, my, myv, mzn, na, nah, nan, nap, nds, ne, new, ng, nl, nn, no, nov, nrf, nso, nv, ny, oc, olo, om, or, os, pa, pag, pam, pap, pcd, pdc, pfl, pi, pih, pl, pms, pnb, pnt, ps, pt, qu, rm, rmy, rn, ro, ru, rue, rup, rw, sa, sah, sat, sc, scn, sco, sd, se, sg, sgs, sh, si, sk, sl, sm, sn, so, sq, sr, srn, ss, st, stq, su, sv, sw, szl, ta, tcy, tdt, te, tg, th, ti, tk, tl, tn, to, tpi, tr, ts, tt, tum, tw, ty, tyv, udm, ug, uk, ur, uz, ve, vec, vep, vi, vls, vo, vro, wa, war, wo, wuu, xal, xh, xmf, yi, yo, yue, za, zea, zh, zu"
|
223 |
+
},
|
224 |
+
{
|
225 |
+
"name": "size_categories",
|
226 |
+
"value": "n<1K, 1K<n<10K, 10K<n<100K, 100K<n<1M, 1M<n<10M"
|
227 |
+
},
|
228 |
+
{
|
229 |
+
"name": "annotations_creators",
|
230 |
+
"value": "no-annotation"
|
231 |
+
},
|
232 |
+
{
|
233 |
+
"name": "language_creators",
|
234 |
+
"value": "crowdsourced"
|
235 |
+
},
|
236 |
+
{
|
237 |
+
"name": "pretty_name",
|
238 |
+
"value": "Wikipedia"
|
239 |
+
},
|
240 |
+
{
|
241 |
+
"name": "source_datasets",
|
242 |
+
"value": "original"
|
243 |
+
},
|
244 |
+
{
|
245 |
+
"name": "paperswithcode_id",
|
246 |
+
"value": null
|
247 |
+
},
|
248 |
+
{
|
249 |
+
"name": "license",
|
250 |
+
"value": "cc-by-sa-3.0, gfdl"
|
251 |
+
}
|
252 |
+
]
|
253 |
+
},
|
254 |
+
"governance": {
|
255 |
+
"owners": [
|
256 |
+
{
|
257 |
+
"organization": {
|
258 |
+
"name": "legacy-datasets",
|
259 |
+
"url": "https://huggingface.co/legacy-datasets"
|
260 |
+
}
|
261 |
+
}
|
262 |
+
]
|
263 |
+
},
|
264 |
+
"description": "Wikipedia dataset containing cleaned articles of all languages.\nThe datasets are built from the Wikipedia dump\n(https://dumps.wikimedia.org/) with one split per language. Each example\ncontains the content of one full Wikipedia article with cleaning to strip\nmarkdown and unwanted sections (references, etc.)."
|
265 |
+
}
|
266 |
+
]
|
267 |
+
},
|
268 |
+
{
|
269 |
+
"type": "data",
|
270 |
+
"bom-ref": "facebook/pmd-71fff1f1-79e2-5837-818a-a847941edaff",
|
271 |
+
"name": "facebook/pmd",
|
272 |
+
"data": [
|
273 |
+
{
|
274 |
+
"type": "dataset",
|
275 |
+
"bom-ref": "facebook/pmd-71fff1f1-79e2-5837-818a-a847941edaff",
|
276 |
+
"name": "facebook/pmd",
|
277 |
+
"contents": {
|
278 |
+
"url": "https://huggingface.co/datasets/facebook/pmd",
|
279 |
+
"properties": [
|
280 |
+
{
|
281 |
+
"name": "task_categories",
|
282 |
+
"value": "image-to-text"
|
283 |
+
},
|
284 |
+
{
|
285 |
+
"name": "task_ids",
|
286 |
+
"value": "image-captioning"
|
287 |
+
},
|
288 |
+
{
|
289 |
+
"name": "language",
|
290 |
+
"value": "en"
|
291 |
+
},
|
292 |
+
{
|
293 |
+
"name": "size_categories",
|
294 |
+
"value": "10M<n<100M"
|
295 |
+
},
|
296 |
+
{
|
297 |
+
"name": "annotations_creators",
|
298 |
+
"value": "found"
|
299 |
+
},
|
300 |
+
{
|
301 |
+
"name": "language_creators",
|
302 |
+
"value": "found"
|
303 |
+
},
|
304 |
+
{
|
305 |
+
"name": "pretty_name",
|
306 |
+
"value": "PMD"
|
307 |
+
},
|
308 |
+
{
|
309 |
+
"name": "source_datasets",
|
310 |
+
"value": "original"
|
311 |
+
},
|
312 |
+
{
|
313 |
+
"name": "paperswithcode_id",
|
314 |
+
"value": "pmd"
|
315 |
+
},
|
316 |
+
{
|
317 |
+
"name": "license",
|
318 |
+
"value": "cc-by-4.0"
|
319 |
+
}
|
320 |
+
]
|
321 |
+
},
|
322 |
+
"governance": {
|
323 |
+
"owners": [
|
324 |
+
{
|
325 |
+
"organization": {
|
326 |
+
"name": "facebook",
|
327 |
+
"url": "https://huggingface.co/facebook"
|
328 |
+
}
|
329 |
+
}
|
330 |
+
]
|
331 |
+
},
|
332 |
+
"description": "Introduced in FLAVA paper, Public Multimodal Dataset (PMD) is a collection of publicly-available image-text pairs datasets. PMD in total contains 70M image-text pairs with 68M unique images. The dataset contains pairs from Conceptual Captions, Conceptual Captions 12M, WIT, Localized Narratives, RedCaps, COCO, SBU Captions, Visual Genome and a subset of YFCC100M dataset."
|
333 |
+
}
|
334 |
+
]
|
335 |
+
},
|
336 |
+
{
|
337 |
+
"type": "data",
|
338 |
+
"bom-ref": "pixparse/idl-wds-5ddb0bef-9a41-5fb6-acce-2d16b0053443",
|
339 |
+
"name": "pixparse/idl-wds",
|
340 |
+
"data": [
|
341 |
+
{
|
342 |
+
"type": "dataset",
|
343 |
+
"bom-ref": "pixparse/idl-wds-5ddb0bef-9a41-5fb6-acce-2d16b0053443",
|
344 |
+
"name": "pixparse/idl-wds",
|
345 |
+
"contents": {
|
346 |
+
"url": "https://huggingface.co/datasets/pixparse/idl-wds",
|
347 |
+
"properties": [
|
348 |
+
{
|
349 |
+
"name": "task_categories",
|
350 |
+
"value": "image-to-text"
|
351 |
+
},
|
352 |
+
{
|
353 |
+
"name": "size_categories",
|
354 |
+
"value": "10M<n<100M"
|
355 |
+
},
|
356 |
+
{
|
357 |
+
"name": "license",
|
358 |
+
"value": "other"
|
359 |
+
},
|
360 |
+
{
|
361 |
+
"name": "license_name",
|
362 |
+
"value": "idl-train"
|
363 |
+
},
|
364 |
+
{
|
365 |
+
"name": "license_link",
|
366 |
+
"value": "LICENSE"
|
367 |
+
}
|
368 |
+
]
|
369 |
+
},
|
370 |
+
"governance": {
|
371 |
+
"owners": [
|
372 |
+
{
|
373 |
+
"organization": {
|
374 |
+
"name": "pixparse",
|
375 |
+
"url": "https://huggingface.co/pixparse"
|
376 |
+
}
|
377 |
+
}
|
378 |
+
]
|
379 |
+
},
|
380 |
+
"description": "\n\t\n\t\t\n\t\tDataset Card for Industry Documents Library (IDL)\n\t\n\n\n\t\n\t\t\n\t\tDataset Summary\n\t\n\nIndustry Documents Library (IDL) is a document dataset filtered from UCSF documents library with 19 million pages kept as valid samples.\nEach document exists as a collection of a pdf, a tiff image with the same contents rendered, a json file containing extensive Textract OCR annotations from the idl_data project, and a .ocr file with the original, older OCR annotation. In each pdf, there may be from 1 to up\u2026 See the full description on the dataset page: https://huggingface.co/datasets/pixparse/idl-wds."
|
381 |
+
}
|
382 |
+
]
|
383 |
+
},
|
384 |
+
{
|
385 |
+
"type": "data",
|
386 |
+
"bom-ref": "pixparse/pdfa-eng-wds-6e24c86a-28c2-50e7-80c1-b74796cd7222",
|
387 |
+
"name": "pixparse/pdfa-eng-wds",
|
388 |
+
"data": [
|
389 |
+
{
|
390 |
+
"type": "dataset",
|
391 |
+
"bom-ref": "pixparse/pdfa-eng-wds-6e24c86a-28c2-50e7-80c1-b74796cd7222",
|
392 |
+
"name": "pixparse/pdfa-eng-wds",
|
393 |
+
"contents": {
|
394 |
+
"url": "https://huggingface.co/datasets/pixparse/pdfa-eng-wds",
|
395 |
+
"properties": [
|
396 |
+
{
|
397 |
+
"name": "task_categories",
|
398 |
+
"value": "image-to-text"
|
399 |
+
},
|
400 |
+
{
|
401 |
+
"name": "language",
|
402 |
+
"value": "en"
|
403 |
+
},
|
404 |
+
{
|
405 |
+
"name": "size_categories",
|
406 |
+
"value": "10M<n<100M"
|
407 |
+
},
|
408 |
+
{
|
409 |
+
"name": "license",
|
410 |
+
"value": "other"
|
411 |
+
},
|
412 |
+
{
|
413 |
+
"name": "license_name",
|
414 |
+
"value": "pdfa-eng-wds"
|
415 |
+
},
|
416 |
+
{
|
417 |
+
"name": "license_link",
|
418 |
+
"value": "LICENSE"
|
419 |
+
}
|
420 |
+
]
|
421 |
+
},
|
422 |
+
"governance": {
|
423 |
+
"owners": [
|
424 |
+
{
|
425 |
+
"organization": {
|
426 |
+
"name": "pixparse",
|
427 |
+
"url": "https://huggingface.co/pixparse"
|
428 |
+
}
|
429 |
+
}
|
430 |
+
]
|
431 |
+
},
|
432 |
+
"description": "\n\t\n\t\t\n\t\tDataset Card for PDF Association dataset (PDFA)\n\t\n\n\n\t\n\t\t\n\t\tDataset Summary\n\t\n\nPDFA dataset is a document dataset filtered from the SafeDocs corpus, aka CC-MAIN-2021-31-PDF-UNTRUNCATED. The original purpose of that corpus is for comprehensive pdf documents analysis. The purpose of that subset differs in that regard, as focus has been done on making the dataset machine learning-ready for vision-language models. \n\n \n An example page of one pdf document, with added bounding boxes\u2026 See the full description on the dataset page: https://huggingface.co/datasets/pixparse/pdfa-eng-wds."
|
433 |
+
}
|
434 |
+
]
|
435 |
+
},
|
436 |
+
{
|
437 |
+
"type": "data",
|
438 |
+
"bom-ref": "wendlerc/RenderedText-2ea0375f-e9a2-55d0-aa1e-734edec2644e",
|
439 |
+
"name": "wendlerc/RenderedText",
|
440 |
+
"data": [
|
441 |
+
{
|
442 |
+
"type": "dataset",
|
443 |
+
"bom-ref": "wendlerc/RenderedText-2ea0375f-e9a2-55d0-aa1e-734edec2644e",
|
444 |
+
"name": "wendlerc/RenderedText",
|
445 |
+
"contents": {
|
446 |
+
"url": "https://huggingface.co/datasets/wendlerc/RenderedText",
|
447 |
+
"properties": [
|
448 |
+
{
|
449 |
+
"name": "task_categories",
|
450 |
+
"value": "text-to-image, image-to-text"
|
451 |
+
},
|
452 |
+
{
|
453 |
+
"name": "language",
|
454 |
+
"value": "en"
|
455 |
+
},
|
456 |
+
{
|
457 |
+
"name": "size_categories",
|
458 |
+
"value": "10M<n<100M"
|
459 |
+
}
|
460 |
+
]
|
461 |
+
},
|
462 |
+
"governance": {
|
463 |
+
"owners": [
|
464 |
+
{
|
465 |
+
"organization": {
|
466 |
+
"name": "wendlerc",
|
467 |
+
"url": "https://huggingface.co/wendlerc"
|
468 |
+
}
|
469 |
+
}
|
470 |
+
]
|
471 |
+
},
|
472 |
+
"description": "This dataset has been created by Stability AI and LAION.\nThis dataset contains 12 million 1024x1024 images of handwritten text written on a digital 3D sheet of paper generated using Blender geometry nodes and rendered using Blender Cycles. The text has varying font size, color, and rotation, and the paper was rendered under random lighting conditions.\nNote that, the first 10 million examples are in the root folder of this dataset repository and the remaining 2 million are in ./remaining (due\u2026 See the full description on the dataset page: https://huggingface.co/datasets/wendlerc/RenderedText."
|
473 |
+
}
|
474 |
+
]
|
475 |
+
},
|
476 |
+
{
|
477 |
+
"type": "data",
|
478 |
+
"bom-ref": "HuggingFaceM4/the_cauldron-0b60b937-29a7-5f0c-9fa6-ec10bf894687",
|
479 |
+
"name": "HuggingFaceM4/the_cauldron",
|
480 |
+
"data": [
|
481 |
+
{
|
482 |
+
"type": "dataset",
|
483 |
+
"bom-ref": "HuggingFaceM4/the_cauldron-0b60b937-29a7-5f0c-9fa6-ec10bf894687",
|
484 |
+
"name": "HuggingFaceM4/the_cauldron",
|
485 |
+
"contents": {
|
486 |
+
"url": "https://huggingface.co/datasets/HuggingFaceM4/the_cauldron",
|
487 |
+
"properties": [
|
488 |
+
{
|
489 |
+
"name": "configs",
|
490 |
+
"value": "Name of the dataset subset: ai2d {\"split\": \"train\", \"path\": \"ai2d/train-*\"}"
|
491 |
+
},
|
492 |
+
{
|
493 |
+
"name": "configs",
|
494 |
+
"value": "Name of the dataset subset: aokvqa {\"split\": \"train\", \"path\": \"aokvqa/train-*\"}"
|
495 |
+
},
|
496 |
+
{
|
497 |
+
"name": "configs",
|
498 |
+
"value": "Name of the dataset subset: chart2text {\"split\": \"train\", \"path\": \"chart2text/train-*\"}"
|
499 |
+
},
|
500 |
+
{
|
501 |
+
"name": "configs",
|
502 |
+
"value": "Name of the dataset subset: chartqa {\"split\": \"train\", \"path\": \"chartqa/train-*\"}"
|
503 |
+
},
|
504 |
+
{
|
505 |
+
"name": "configs",
|
506 |
+
"value": "Name of the dataset subset: clevr {\"split\": \"train\", \"path\": \"clevr/train-*\"}"
|
507 |
+
},
|
508 |
+
{
|
509 |
+
"name": "configs",
|
510 |
+
"value": "Name of the dataset subset: clevr_math {\"split\": \"train\", \"path\": \"clevr_math/train-*\"}"
|
511 |
+
},
|
512 |
+
{
|
513 |
+
"name": "configs",
|
514 |
+
"value": "Name of the dataset subset: cocoqa {\"split\": \"train\", \"path\": \"cocoqa/train-*\"}"
|
515 |
+
},
|
516 |
+
{
|
517 |
+
"name": "configs",
|
518 |
+
"value": "Name of the dataset subset: datikz {\"split\": \"train\", \"path\": \"datikz/train-*\"}"
|
519 |
+
},
|
520 |
+
{
|
521 |
+
"name": "configs",
|
522 |
+
"value": "Name of the dataset subset: diagram_image_to_text {\"split\": \"train\", \"path\": \"diagram_image_to_text/train-*\"}"
|
523 |
+
},
|
524 |
+
{
|
525 |
+
"name": "configs",
|
526 |
+
"value": "Name of the dataset subset: docvqa {\"split\": \"train\", \"path\": \"docvqa/train-*\"}"
|
527 |
+
},
|
528 |
+
{
|
529 |
+
"name": "configs",
|
530 |
+
"value": "Name of the dataset subset: dvqa {\"split\": \"train\", \"path\": \"dvqa/train-*\"}"
|
531 |
+
},
|
532 |
+
{
|
533 |
+
"name": "configs",
|
534 |
+
"value": "Name of the dataset subset: figureqa {\"split\": \"train\", \"path\": \"figureqa/train-*\"}"
|
535 |
+
},
|
536 |
+
{
|
537 |
+
"name": "configs",
|
538 |
+
"value": "Name of the dataset subset: finqa {\"split\": \"train\", \"path\": \"finqa/train-*\"}"
|
539 |
+
},
|
540 |
+
{
|
541 |
+
"name": "configs",
|
542 |
+
"value": "Name of the dataset subset: geomverse {\"split\": \"train\", \"path\": \"geomverse/train-*\"}"
|
543 |
+
},
|
544 |
+
{
|
545 |
+
"name": "configs",
|
546 |
+
"value": "Name of the dataset subset: hateful_memes {\"split\": \"train\", \"path\": \"hateful_memes/train-*\"}"
|
547 |
+
},
|
548 |
+
{
|
549 |
+
"name": "configs",
|
550 |
+
"value": "Name of the dataset subset: hitab {\"split\": \"train\", \"path\": \"hitab/train-*\"}"
|
551 |
+
},
|
552 |
+
{
|
553 |
+
"name": "configs",
|
554 |
+
"value": "Name of the dataset subset: iam {\"split\": \"train\", \"path\": \"iam/train-*\"}"
|
555 |
+
},
|
556 |
+
{
|
557 |
+
"name": "configs",
|
558 |
+
"value": "Name of the dataset subset: iconqa {\"split\": \"train\", \"path\": \"iconqa/train-*\"}"
|
559 |
+
},
|
560 |
+
{
|
561 |
+
"name": "configs",
|
562 |
+
"value": "Name of the dataset subset: infographic_vqa {\"split\": \"train\", \"path\": \"infographic_vqa/train-*\"}"
|
563 |
+
},
|
564 |
+
{
|
565 |
+
"name": "configs",
|
566 |
+
"value": "Name of the dataset subset: intergps {\"split\": \"train\", \"path\": \"intergps/train-*\"}"
|
567 |
+
},
|
568 |
+
{
|
569 |
+
"name": "configs",
|
570 |
+
"value": "Name of the dataset subset: localized_narratives {\"split\": \"train\", \"path\": \"localized_narratives/train-*\"}"
|
571 |
+
},
|
572 |
+
{
|
573 |
+
"name": "configs",
|
574 |
+
"value": "Name of the dataset subset: mapqa {\"split\": \"train\", \"path\": \"mapqa/train-*\"}"
|
575 |
+
},
|
576 |
+
{
|
577 |
+
"name": "configs",
|
578 |
+
"value": "Name of the dataset subset: mimic_cgd {\"split\": \"train\", \"path\": \"mimic_cgd/train-*\"}"
|
579 |
+
},
|
580 |
+
{
|
581 |
+
"name": "configs",
|
582 |
+
"value": "Name of the dataset subset: multihiertt {\"split\": \"train\", \"path\": \"multihiertt/train-*\"}"
|
583 |
+
},
|
584 |
+
{
|
585 |
+
"name": "configs",
|
586 |
+
"value": "Name of the dataset subset: nlvr2 {\"split\": \"train\", \"path\": \"nlvr2/train-*\"}"
|
587 |
+
},
|
588 |
+
{
|
589 |
+
"name": "configs",
|
590 |
+
"value": "Name of the dataset subset: ocrvqa {\"split\": \"train\", \"path\": \"ocrvqa/train-*\"}"
|
591 |
+
},
|
592 |
+
{
|
593 |
+
"name": "configs",
|
594 |
+
"value": "Name of the dataset subset: okvqa {\"split\": \"train\", \"path\": \"okvqa/train-*\"}"
|
595 |
+
},
|
596 |
+
{
|
597 |
+
"name": "configs",
|
598 |
+
"value": "Name of the dataset subset: plotqa {\"split\": \"train\", \"path\": \"plotqa/train-*\"}"
|
599 |
+
},
|
600 |
+
{
|
601 |
+
"name": "configs",
|
602 |
+
"value": "Name of the dataset subset: raven {\"split\": \"train\", \"path\": \"raven/train-*\"}"
|
603 |
+
},
|
604 |
+
{
|
605 |
+
"name": "configs",
|
606 |
+
"value": "Name of the dataset subset: rendered_text {\"split\": \"train\", \"path\": \"rendered_text/train-*\"}"
|
607 |
+
},
|
608 |
+
{
|
609 |
+
"name": "configs",
|
610 |
+
"value": "Name of the dataset subset: robut_sqa {\"split\": \"train\", \"path\": \"robut_sqa/train-*\"}"
|
611 |
+
},
|
612 |
+
{
|
613 |
+
"name": "configs",
|
614 |
+
"value": "Name of the dataset subset: robut_wikisql {\"split\": \"train\", \"path\": \"robut_wikisql/train-*\"}"
|
615 |
+
},
|
616 |
+
{
|
617 |
+
"name": "configs",
|
618 |
+
"value": "Name of the dataset subset: robut_wtq {\"split\": \"train\", \"path\": \"robut_wtq/train-*\"}"
|
619 |
+
},
|
620 |
+
{
|
621 |
+
"name": "configs",
|
622 |
+
"value": "Name of the dataset subset: scienceqa {\"split\": \"train\", \"path\": \"scienceqa/train-*\"}"
|
623 |
+
},
|
624 |
+
{
|
625 |
+
"name": "configs",
|
626 |
+
"value": "Name of the dataset subset: screen2words {\"split\": \"train\", \"path\": \"screen2words/train-*\"}"
|
627 |
+
},
|
628 |
+
{
|
629 |
+
"name": "configs",
|
630 |
+
"value": "Name of the dataset subset: spot_the_diff {\"split\": \"train\", \"path\": \"spot_the_diff/train-*\"}"
|
631 |
+
},
|
632 |
+
{
|
633 |
+
"name": "configs",
|
634 |
+
"value": "Name of the dataset subset: st_vqa {\"split\": \"train\", \"path\": \"st_vqa/train-*\"}"
|
635 |
+
},
|
636 |
+
{
|
637 |
+
"name": "configs",
|
638 |
+
"value": "Name of the dataset subset: tabmwp {\"split\": \"train\", \"path\": \"tabmwp/train-*\"}"
|
639 |
+
},
|
640 |
+
{
|
641 |
+
"name": "configs",
|
642 |
+
"value": "Name of the dataset subset: tallyqa {\"split\": \"train\", \"path\": \"tallyqa/train-*\"}"
|
643 |
+
},
|
644 |
+
{
|
645 |
+
"name": "configs",
|
646 |
+
"value": "Name of the dataset subset: tat_qa {\"split\": \"train\", \"path\": \"tat_qa/train-*\"}"
|
647 |
+
},
|
648 |
+
{
|
649 |
+
"name": "configs",
|
650 |
+
"value": "Name of the dataset subset: textcaps {\"split\": \"train\", \"path\": \"textcaps/train-*\"}"
|
651 |
+
},
|
652 |
+
{
|
653 |
+
"name": "configs",
|
654 |
+
"value": "Name of the dataset subset: textvqa {\"split\": \"train\", \"path\": \"textvqa/train-*\"}"
|
655 |
+
},
|
656 |
+
{
|
657 |
+
"name": "configs",
|
658 |
+
"value": "Name of the dataset subset: tqa {\"split\": \"train\", \"path\": \"tqa/train-*\"}"
|
659 |
+
},
|
660 |
+
{
|
661 |
+
"name": "configs",
|
662 |
+
"value": "Name of the dataset subset: vistext {\"split\": \"train\", \"path\": \"vistext/train-*\"}"
|
663 |
+
},
|
664 |
+
{
|
665 |
+
"name": "configs",
|
666 |
+
"value": "Name of the dataset subset: visual7w {\"split\": \"train\", \"path\": \"visual7w/train-*\"}"
|
667 |
+
},
|
668 |
+
{
|
669 |
+
"name": "configs",
|
670 |
+
"value": "Name of the dataset subset: visualmrc {\"split\": \"train\", \"path\": \"visualmrc/train-*\"}"
|
671 |
+
},
|
672 |
+
{
|
673 |
+
"name": "configs",
|
674 |
+
"value": "Name of the dataset subset: vqarad {\"split\": \"train\", \"path\": \"vqarad/train-*\"}"
|
675 |
+
},
|
676 |
+
{
|
677 |
+
"name": "configs",
|
678 |
+
"value": "Name of the dataset subset: vqav2 {\"split\": \"train\", \"path\": \"vqav2/train-*\"}"
|
679 |
+
},
|
680 |
+
{
|
681 |
+
"name": "configs",
|
682 |
+
"value": "Name of the dataset subset: vsr {\"split\": \"train\", \"path\": \"vsr/train-*\"}"
|
683 |
+
},
|
684 |
+
{
|
685 |
+
"name": "configs",
|
686 |
+
"value": "Name of the dataset subset: websight {\"split\": \"train\", \"path\": \"websight/train-*\"}"
|
687 |
+
}
|
688 |
+
]
|
689 |
+
},
|
690 |
+
"governance": {
|
691 |
+
"owners": [
|
692 |
+
{
|
693 |
+
"organization": {
|
694 |
+
"name": "HuggingFaceM4",
|
695 |
+
"url": "https://huggingface.co/HuggingFaceM4"
|
696 |
+
}
|
697 |
+
}
|
698 |
+
]
|
699 |
+
},
|
700 |
+
"description": "\n\t\n\t\t\n\t\tDataset Card for The Cauldron\n\t\n\n\n\n\t\n\t\t\n\t\tDataset description\n\t\n\nThe Cauldron is part of the Idefics2 release.\nIt is a massive collection of 50 vision-language datasets (training sets only) that were used for the fine-tuning of the vision-language model Idefics2.\n\n\t\n\t\t\n\t\tLoad the dataset\n\t\n\nTo load the dataset, install the library datasets with pip install datasets. Then,\nfrom datasets import load_dataset\nds = load_dataset(\"HuggingFaceM4/the_cauldron\", \"ai2d\")\n\nto download and load the\u2026 See the full description on the dataset page: https://huggingface.co/datasets/HuggingFaceM4/the_cauldron."
|
701 |
+
}
|
702 |
+
]
|
703 |
+
},
|
704 |
+
{
|
705 |
+
"type": "data",
|
706 |
+
"bom-ref": "teknium/OpenHermes-2.5-1a7eb3be-7eaa-5577-91f6-d4ad0d639c6c",
|
707 |
+
"name": "teknium/OpenHermes-2.5",
|
708 |
+
"data": [
|
709 |
+
{
|
710 |
+
"type": "dataset",
|
711 |
+
"bom-ref": "teknium/OpenHermes-2.5-1a7eb3be-7eaa-5577-91f6-d4ad0d639c6c",
|
712 |
+
"name": "teknium/OpenHermes-2.5",
|
713 |
+
"contents": {
|
714 |
+
"url": "https://huggingface.co/datasets/teknium/OpenHermes-2.5",
|
715 |
+
"properties": [
|
716 |
+
{
|
717 |
+
"name": "language",
|
718 |
+
"value": "eng"
|
719 |
+
},
|
720 |
+
{
|
721 |
+
"name": "pretty_name",
|
722 |
+
"value": "OpenHermes 2.5"
|
723 |
+
}
|
724 |
+
]
|
725 |
+
},
|
726 |
+
"governance": {
|
727 |
+
"owners": [
|
728 |
+
{
|
729 |
+
"organization": {
|
730 |
+
"name": "teknium",
|
731 |
+
"url": "https://huggingface.co/teknium"
|
732 |
+
}
|
733 |
+
}
|
734 |
+
]
|
735 |
+
},
|
736 |
+
"description": "\n\n\t\n\t\t\n\t\tDataset Card for Dataset Name\n\t\n\nThis is the dataset that made OpenHermes 2.5 and Nous Hermes 2 series of models.\nSupport me on GitHub sponsors <3 : https://github.com/sponsors/teknium1\n\n\t\n\t\t\n\t\tDataset Details\n\t\n\n\n\t\n\t\t\n\t\tDataset Description\n\t\n\nThe Open Hermes 2/2.5 and Nous Hermes 2 models have made significant advancements of SOTA LLM's over recent months, and are underpinned by this exact compilation and curation of many open source datasets and custom created synthetic datasets.\u2026 See the full description on the dataset page: https://huggingface.co/datasets/teknium/OpenHermes-2.5."
|
737 |
+
}
|
738 |
+
]
|
739 |
+
},
|
740 |
+
{
|
741 |
+
"type": "data",
|
742 |
+
"bom-ref": "GAIR/lima-afa8f631-d0ed-59c0-a5a1-170c80a5117e",
|
743 |
+
"name": "GAIR/lima",
|
744 |
+
"data": [
|
745 |
+
{
|
746 |
+
"type": "dataset",
|
747 |
+
"bom-ref": "GAIR/lima-afa8f631-d0ed-59c0-a5a1-170c80a5117e",
|
748 |
+
"name": "GAIR/lima",
|
749 |
+
"contents": {
|
750 |
+
"url": "https://huggingface.co/datasets/GAIR/lima",
|
751 |
+
"properties": [
|
752 |
+
{
|
753 |
+
"name": "license",
|
754 |
+
"value": "other"
|
755 |
+
}
|
756 |
+
]
|
757 |
+
},
|
758 |
+
"governance": {
|
759 |
+
"owners": [
|
760 |
+
{
|
761 |
+
"organization": {
|
762 |
+
"name": "GAIR",
|
763 |
+
"url": "https://huggingface.co/GAIR"
|
764 |
+
}
|
765 |
+
}
|
766 |
+
]
|
767 |
+
},
|
768 |
+
"description": "A high-quality dataset for efficient instruction tuning."
|
769 |
+
}
|
770 |
+
]
|
771 |
+
},
|
772 |
+
{
|
773 |
+
"type": "data",
|
774 |
+
"bom-ref": "databricks/databricks-dolly-15k-1008cfb1-7624-5c5b-93cc-d856239b86ea",
|
775 |
+
"name": "databricks/databricks-dolly-15k",
|
776 |
+
"data": [
|
777 |
+
{
|
778 |
+
"type": "dataset",
|
779 |
+
"bom-ref": "databricks/databricks-dolly-15k-1008cfb1-7624-5c5b-93cc-d856239b86ea",
|
780 |
+
"name": "databricks/databricks-dolly-15k",
|
781 |
+
"contents": {
|
782 |
+
"url": "https://huggingface.co/datasets/databricks/databricks-dolly-15k",
|
783 |
+
"properties": [
|
784 |
+
{
|
785 |
+
"name": "task_categories",
|
786 |
+
"value": "question-answering, summarization"
|
787 |
+
},
|
788 |
+
{
|
789 |
+
"name": "language",
|
790 |
+
"value": "en"
|
791 |
+
},
|
792 |
+
{
|
793 |
+
"name": "size_categories",
|
794 |
+
"value": "10K<n<100K"
|
795 |
+
},
|
796 |
+
{
|
797 |
+
"name": "license",
|
798 |
+
"value": "cc-by-sa-3.0"
|
799 |
+
}
|
800 |
+
]
|
801 |
+
},
|
802 |
+
"governance": {
|
803 |
+
"owners": [
|
804 |
+
{
|
805 |
+
"organization": {
|
806 |
+
"name": "databricks",
|
807 |
+
"url": "https://huggingface.co/databricks"
|
808 |
+
}
|
809 |
+
}
|
810 |
+
]
|
811 |
+
},
|
812 |
+
"description": "\n\t\n\t\t\n\t\tSummary\n\t\n\ndatabricks-dolly-15k is an open source dataset of instruction-following records generated by thousands of Databricks employees in several \nof the behavioral categories outlined in the InstructGPT paper, including brainstorming, classification, \nclosed QA, generation, information extraction, open QA, and summarization.\nThis dataset can be used for any purpose, whether academic or commercial, under the terms of the \nCreative Commons Attribution-ShareAlike 3.0 Unported\u2026 See the full description on the dataset page: https://huggingface.co/datasets/databricks/databricks-dolly-15k."
|
813 |
+
}
|
814 |
+
]
|
815 |
+
},
|
816 |
+
{
|
817 |
+
"type": "data",
|
818 |
+
"bom-ref": "meta-math/MetaMathQA-c6cf810a-8b06-5552-a876-53681c5fe9a1",
|
819 |
+
"name": "meta-math/MetaMathQA",
|
820 |
+
"data": [
|
821 |
+
{
|
822 |
+
"type": "dataset",
|
823 |
+
"bom-ref": "meta-math/MetaMathQA-c6cf810a-8b06-5552-a876-53681c5fe9a1",
|
824 |
+
"name": "meta-math/MetaMathQA",
|
825 |
+
"contents": {
|
826 |
+
"url": "https://huggingface.co/datasets/meta-math/MetaMathQA",
|
827 |
+
"properties": [
|
828 |
+
{
|
829 |
+
"name": "license",
|
830 |
+
"value": "mit"
|
831 |
+
}
|
832 |
+
]
|
833 |
+
},
|
834 |
+
"governance": {
|
835 |
+
"owners": [
|
836 |
+
{
|
837 |
+
"organization": {
|
838 |
+
"name": "meta-math",
|
839 |
+
"url": "https://huggingface.co/meta-math"
|
840 |
+
}
|
841 |
+
}
|
842 |
+
]
|
843 |
+
},
|
844 |
+
"description": "View the project page:\nhttps://meta-math.github.io/\nsee our paper at https://arxiv.org/abs/2309.12284\n\n\t\n\t\t\n\t\tNote\n\t\n\nAll MetaMathQA data are augmented from the training sets of GSM8K and MATH. \nNone of the augmented data is from the testing set.\nYou can check the original_question in meta-math/MetaMathQA, each item is from the GSM8K or MATH train set.\n\n\t\n\t\t\n\t\tModel Details\n\t\n\nMetaMath-Mistral-7B is fully fine-tuned on the MetaMathQA datasets and based on the powerful Mistral-7B model. It is\u2026 See the full description on the dataset page: https://huggingface.co/datasets/meta-math/MetaMathQA."
|
845 |
+
}
|
846 |
+
]
|
847 |
+
},
|
848 |
+
{
|
849 |
+
"type": "data",
|
850 |
+
"bom-ref": "TIGER-Lab/MathInstruct-9d9c997d-f6c1-5029-96fd-6003c4f0ec06",
|
851 |
+
"name": "TIGER-Lab/MathInstruct",
|
852 |
+
"data": [
|
853 |
+
{
|
854 |
+
"type": "dataset",
|
855 |
+
"bom-ref": "TIGER-Lab/MathInstruct-9d9c997d-f6c1-5029-96fd-6003c4f0ec06",
|
856 |
+
"name": "TIGER-Lab/MathInstruct",
|
857 |
+
"contents": {
|
858 |
+
"url": "https://huggingface.co/datasets/TIGER-Lab/MathInstruct",
|
859 |
+
"properties": [
|
860 |
+
{
|
861 |
+
"name": "task_categories",
|
862 |
+
"value": "text-generation"
|
863 |
+
},
|
864 |
+
{
|
865 |
+
"name": "language",
|
866 |
+
"value": "en"
|
867 |
+
},
|
868 |
+
{
|
869 |
+
"name": "size_categories",
|
870 |
+
"value": "100K<n<1M"
|
871 |
+
},
|
872 |
+
{
|
873 |
+
"name": "pretty_name",
|
874 |
+
"value": "MathInstruct"
|
875 |
+
},
|
876 |
+
{
|
877 |
+
"name": "license",
|
878 |
+
"value": "mit"
|
879 |
+
}
|
880 |
+
]
|
881 |
+
},
|
882 |
+
"governance": {
|
883 |
+
"owners": [
|
884 |
+
{
|
885 |
+
"organization": {
|
886 |
+
"name": "TIGER-Lab",
|
887 |
+
"url": "https://huggingface.co/TIGER-Lab"
|
888 |
+
}
|
889 |
+
}
|
890 |
+
]
|
891 |
+
},
|
892 |
+
"description": "\n\t\n\t\t\n\t\t\ud83e\udda3 MAmmoTH: Building Math Generalist Models through Hybrid Instruction Tuning\n\t\n\nMathInstruct is a meticulously curated instruction tuning dataset that is lightweight yet generalizable. MathInstruct is compiled from 13 math rationale datasets, six of which are newly curated by this work. It uniquely focuses on the hybrid use of chain-of-thought (CoT) and program-of-thought (PoT) rationales, and ensures extensive coverage of diverse mathematical fields. \nProject Page:\u2026 See the full description on the dataset page: https://huggingface.co/datasets/TIGER-Lab/MathInstruct."
|
893 |
+
}
|
894 |
+
]
|
895 |
+
},
|
896 |
+
{
|
897 |
+
"type": "data",
|
898 |
+
"bom-ref": "microsoft/orca-math-word-problems-200k-611afa9f-b6db-5b9f-9a51-598e4ce79d0e",
|
899 |
+
"name": "microsoft/orca-math-word-problems-200k",
|
900 |
+
"data": [
|
901 |
+
{
|
902 |
+
"type": "dataset",
|
903 |
+
"bom-ref": "microsoft/orca-math-word-problems-200k-611afa9f-b6db-5b9f-9a51-598e4ce79d0e",
|
904 |
+
"name": "microsoft/orca-math-word-problems-200k",
|
905 |
+
"contents": {
|
906 |
+
"url": "https://huggingface.co/datasets/microsoft/orca-math-word-problems-200k",
|
907 |
+
"properties": [
|
908 |
+
{
|
909 |
+
"name": "task_categories",
|
910 |
+
"value": "question-answering"
|
911 |
+
},
|
912 |
+
{
|
913 |
+
"name": "language",
|
914 |
+
"value": "en"
|
915 |
+
},
|
916 |
+
{
|
917 |
+
"name": "size_categories",
|
918 |
+
"value": "100K<n<1M"
|
919 |
+
},
|
920 |
+
{
|
921 |
+
"name": "configs",
|
922 |
+
"value": "Name of the dataset subset: default {\"split\": \"train\", \"path\": \"data/train-*\"}"
|
923 |
+
},
|
924 |
+
{
|
925 |
+
"name": "license",
|
926 |
+
"value": "mit"
|
927 |
+
}
|
928 |
+
]
|
929 |
+
},
|
930 |
+
"governance": {
|
931 |
+
"owners": [
|
932 |
+
{
|
933 |
+
"organization": {
|
934 |
+
"name": "microsoft",
|
935 |
+
"url": "https://huggingface.co/microsoft"
|
936 |
+
}
|
937 |
+
}
|
938 |
+
]
|
939 |
+
},
|
940 |
+
"description": "\n\t\n\t\t\n\t\tDataset Card\n\t\n\n\n\nThis dataset contains ~200K grade school math word problems. All the answers in this dataset is generated using Azure GPT4-Turbo. Please refer to Orca-Math: Unlocking the potential of\nSLMs in Grade School Math for details about the dataset construction. \n\n\t\n\t\t\n\t\tDataset Sources\n\t\n\n\n\n\nRepository: microsoft/orca-math-word-problems-200k\nPaper: Orca-Math: Unlocking the potential of\nSLMs in Grade School Math\n\n\n\t\n\t\t\n\t\tDirect Use\n\t\n\n\n\nThis dataset has been designed to\u2026 See the full description on the dataset page: https://huggingface.co/datasets/microsoft/orca-math-word-problems-200k."
|
941 |
+
}
|
942 |
+
]
|
943 |
+
},
|
944 |
+
{
|
945 |
+
"type": "data",
|
946 |
+
"bom-ref": "camel-ai/math-9f7ffeb0-2fb3-5b72-9ca4-1b461f022e61",
|
947 |
+
"name": "camel-ai/math",
|
948 |
+
"data": [
|
949 |
+
{
|
950 |
+
"type": "dataset",
|
951 |
+
"bom-ref": "camel-ai/math-9f7ffeb0-2fb3-5b72-9ca4-1b461f022e61",
|
952 |
+
"name": "camel-ai/math",
|
953 |
+
"contents": {
|
954 |
+
"url": "https://huggingface.co/datasets/camel-ai/math",
|
955 |
+
"properties": [
|
956 |
+
{
|
957 |
+
"name": "task_categories",
|
958 |
+
"value": "text-generation"
|
959 |
+
},
|
960 |
+
{
|
961 |
+
"name": "language",
|
962 |
+
"value": "en"
|
963 |
+
},
|
964 |
+
{
|
965 |
+
"name": "pretty_name",
|
966 |
+
"value": "CAMEL Math"
|
967 |
+
},
|
968 |
+
{
|
969 |
+
"name": "license",
|
970 |
+
"value": "cc-by-nc-4.0"
|
971 |
+
}
|
972 |
+
]
|
973 |
+
},
|
974 |
+
"governance": {
|
975 |
+
"owners": [
|
976 |
+
{
|
977 |
+
"organization": {
|
978 |
+
"name": "camel-ai",
|
979 |
+
"url": "https://huggingface.co/camel-ai"
|
980 |
+
}
|
981 |
+
}
|
982 |
+
]
|
983 |
+
},
|
984 |
+
"description": "\n\t\n\t\t\n\t\tCAMEL: Communicative Agents for \u201cMind\u201d Exploration of Large Scale Language Model Society\n\t\n\n\nGithub: https://github.com/lightaime/camel\nWebsite: https://www.camel-ai.org/\nArxiv Paper: https://arxiv.org/abs/2303.17760\n\n\n\t\n\t\t\n\t\n\t\n\t\tDataset Summary\n\t\n\nMath dataset is composed of 50K problem-solution pairs obtained using GPT-4. The dataset problem-solutions pairs generating from 25 math topics, 25 subtopics for each topic and 80 problems for each \"topic,subtopic\" pairs.\nWe provide the data\u2026 See the full description on the dataset page: https://huggingface.co/datasets/camel-ai/math."
|
985 |
+
}
|
986 |
+
]
|
987 |
+
},
|
988 |
+
{
|
989 |
+
"type": "data",
|
990 |
+
"bom-ref": "AtlasUnified/atlas-math-sets-49141027-0c69-515d-8182-254cf889efae",
|
991 |
+
"name": "AtlasUnified/atlas-math-sets",
|
992 |
+
"data": [
|
993 |
+
{
|
994 |
+
"type": "dataset",
|
995 |
+
"bom-ref": "AtlasUnified/atlas-math-sets-49141027-0c69-515d-8182-254cf889efae",
|
996 |
+
"name": "AtlasUnified/atlas-math-sets",
|
997 |
+
"contents": {
|
998 |
+
"url": "https://huggingface.co/datasets/AtlasUnified/atlas-math-sets",
|
999 |
+
"properties": [
|
1000 |
+
{
|
1001 |
+
"name": "task_categories",
|
1002 |
+
"value": "question-answering"
|
1003 |
+
},
|
1004 |
+
{
|
1005 |
+
"name": "language",
|
1006 |
+
"value": "en"
|
1007 |
+
},
|
1008 |
+
{
|
1009 |
+
"name": "size_categories",
|
1010 |
+
"value": "10M<n<100M"
|
1011 |
+
},
|
1012 |
+
{
|
1013 |
+
"name": "pretty_name",
|
1014 |
+
"value": "Atlas Math Sets"
|
1015 |
+
},
|
1016 |
+
{
|
1017 |
+
"name": "license",
|
1018 |
+
"value": "mit"
|
1019 |
+
}
|
1020 |
+
]
|
1021 |
+
},
|
1022 |
+
"governance": {
|
1023 |
+
"owners": [
|
1024 |
+
{
|
1025 |
+
"organization": {
|
1026 |
+
"name": "AtlasUnified",
|
1027 |
+
"url": "https://huggingface.co/AtlasUnified"
|
1028 |
+
}
|
1029 |
+
}
|
1030 |
+
]
|
1031 |
+
},
|
1032 |
+
"description": "\n\t\n\t\t\n\t\tATLAS MATH SETS\n\t\n\n\nThis set of data consists of mathematical computations. Simple in nature as it derived from python scripts, this dataset contains addition, subtraction, multiplication, division, fractions, decimals, square roots, cube roots, exponents, and factors.\nFormat of the JSONL is as follows:\n{\"answer\": \"[num]\", \"input\": \"[equation]\", \"output\": \"[num]\", \"instruction\": \"[pre-generated_instruction] [equation]\"}\n"
|
1033 |
+
}
|
1034 |
+
]
|
1035 |
+
},
|
1036 |
+
{
|
1037 |
+
"type": "data",
|
1038 |
+
"bom-ref": "tiedong/goat-38642401-79d7-541d-a92f-d3d7acdb8db8",
|
1039 |
+
"name": "tiedong/goat",
|
1040 |
+
"data": [
|
1041 |
+
{
|
1042 |
+
"type": "dataset",
|
1043 |
+
"bom-ref": "tiedong/goat-38642401-79d7-541d-a92f-d3d7acdb8db8",
|
1044 |
+
"name": "tiedong/goat",
|
1045 |
+
"contents": {
|
1046 |
+
"url": "https://huggingface.co/datasets/tiedong/goat",
|
1047 |
+
"properties": [
|
1048 |
+
{
|
1049 |
+
"name": "task_categories",
|
1050 |
+
"value": "question-answering"
|
1051 |
+
},
|
1052 |
+
{
|
1053 |
+
"name": "language",
|
1054 |
+
"value": "en"
|
1055 |
+
},
|
1056 |
+
{
|
1057 |
+
"name": "size_categories",
|
1058 |
+
"value": "1M<n<10M"
|
1059 |
+
},
|
1060 |
+
{
|
1061 |
+
"name": "license",
|
1062 |
+
"value": "apache-2.0"
|
1063 |
+
}
|
1064 |
+
]
|
1065 |
+
},
|
1066 |
+
"governance": {
|
1067 |
+
"owners": [
|
1068 |
+
{
|
1069 |
+
"organization": {
|
1070 |
+
"name": "tiedong",
|
1071 |
+
"url": "https://huggingface.co/tiedong"
|
1072 |
+
}
|
1073 |
+
}
|
1074 |
+
]
|
1075 |
+
},
|
1076 |
+
"description": "\n\t\n\t\t\n\t\tDataset Card for Dataset Name\n\t\n\n\n\t\n\t\t\n\t\tDataset Summary\n\t\n\nThe dataset.json file contains ~1.7 million synthetic data for arithmetic tasks, generated by dataset.ipynb.\n\n\t\n\t\t\n\t\tSupported Tasks and Leaderboards\n\t\n\n[More Information Needed]\n\n\t\n\t\t\n\t\tLanguages\n\t\n\n[More Information Needed]\n\n\t\n\t\t\n\t\tDataset Structure\n\t\n\n\n\t\n\t\t\n\t\tData Instances\n\t\n\n[More Information Needed]\n\n\t\n\t\t\n\t\tData Fields\n\t\n\n[More Information Needed]\n\n\t\n\t\t\n\t\tData Splits\n\t\n\n[More Information Needed]\n\n\t\n\t\t\n\t\tDataset Creation\u2026 See the full description on the dataset page: https://huggingface.co/datasets/tiedong/goat."
|
1077 |
+
}
|
1078 |
+
]
|
1079 |
+
},
|
1080 |
+
{
|
1081 |
+
"type": "data",
|
1082 |
+
"bom-ref": "Lin-Chen/ShareGPT4V-f6982603-3c10-5cd0-9d2d-83d573b61341",
|
1083 |
+
"name": "Lin-Chen/ShareGPT4V",
|
1084 |
+
"data": [
|
1085 |
+
{
|
1086 |
+
"type": "dataset",
|
1087 |
+
"bom-ref": "Lin-Chen/ShareGPT4V-f6982603-3c10-5cd0-9d2d-83d573b61341",
|
1088 |
+
"name": "Lin-Chen/ShareGPT4V",
|
1089 |
+
"contents": {
|
1090 |
+
"url": "https://huggingface.co/datasets/Lin-Chen/ShareGPT4V",
|
1091 |
+
"properties": [
|
1092 |
+
{
|
1093 |
+
"name": "task_categories",
|
1094 |
+
"value": "visual-question-answering, question-answering"
|
1095 |
+
},
|
1096 |
+
{
|
1097 |
+
"name": "language",
|
1098 |
+
"value": "en"
|
1099 |
+
},
|
1100 |
+
{
|
1101 |
+
"name": "size_categories",
|
1102 |
+
"value": "1M<n"
|
1103 |
+
},
|
1104 |
+
{
|
1105 |
+
"name": "pretty_name",
|
1106 |
+
"value": "ShareGPT4V Captions 1.2M Dataset Card"
|
1107 |
+
},
|
1108 |
+
{
|
1109 |
+
"name": "configs",
|
1110 |
+
"value": "Name of the dataset subset: ShareGPT4V \"s\", \"h\", \"a\", \"r\", \"e\", \"g\", \"p\", \"t\", \"4\", \"v\", \"_\", \"i\", \"n\", \"s\", \"t\", \"r\", \"u\", \"c\", \"t\", \"_\", \"g\", \"p\", \"t\", \"4\", \"-\", \"v\", \"i\", \"s\", \"i\", \"o\", \"n\", \"_\", \"c\", \"a\", \"p\", \"1\", \"0\", \"0\", \"k\", \".\", \"j\", \"s\", \"o\", \"n\""
|
1111 |
+
},
|
1112 |
+
{
|
1113 |
+
"name": "configs",
|
1114 |
+
"value": "Name of the dataset subset: ShareGPT4V-PT \"s\", \"h\", \"a\", \"r\", \"e\", \"-\", \"c\", \"a\", \"p\", \"t\", \"i\", \"o\", \"n\", \"e\", \"r\", \"_\", \"c\", \"o\", \"c\", \"o\", \"_\", \"l\", \"c\", \"s\", \"_\", \"s\", \"a\", \"m\", \"_\", \"1\", \"2\", \"4\", \"6\", \"k\", \"_\", \"1\", \"1\", \"0\", \"7\", \".\", \"j\", \"s\", \"o\", \"n\""
|
1115 |
+
},
|
1116 |
+
{
|
1117 |
+
"name": "license",
|
1118 |
+
"value": "cc-by-nc-4.0"
|
1119 |
+
}
|
1120 |
+
]
|
1121 |
+
},
|
1122 |
+
"governance": {
|
1123 |
+
"owners": [
|
1124 |
+
{
|
1125 |
+
"organization": {
|
1126 |
+
"name": "Lin-Chen",
|
1127 |
+
"url": "https://huggingface.co/Lin-Chen"
|
1128 |
+
}
|
1129 |
+
}
|
1130 |
+
]
|
1131 |
+
},
|
1132 |
+
"description": "\n\t\n\t\t\n\t\tNews\n\t\n\n[2024/5/8] We released ShareGPT4Video, a large-scale video-caption dataset, with 40K captions annotated by GPT4V and 4.8M captions annotated by our ShareCaptioner-Video. The total videos last with 300 hours and 3000 hours separately!\n\n\t\n\t\t\n\t\tShareGPT4V 1.2M Dataset Card\n\t\n\n\n\t\n\t\t\n\t\tDataset details\n\t\n\nDataset type:\nShareGPT4V Captions 1.2M is a set of GPT4-Vision-powered multi-modal captions data.\nIt is constructed to enhance modality alignment and fine-grained visual concept\u2026 See the full description on the dataset page: https://huggingface.co/datasets/Lin-Chen/ShareGPT4V."
|
1133 |
+
}
|
1134 |
+
]
|
1135 |
+
},
|
1136 |
+
{
|
1137 |
+
"type": "data",
|
1138 |
+
"bom-ref": "jxu124/llava_conversation_58k-7dcd95f0-d26a-5075-89f4-4afc13a5b93f",
|
1139 |
+
"name": "jxu124/llava_conversation_58k",
|
1140 |
+
"data": [
|
1141 |
+
{
|
1142 |
+
"type": "dataset",
|
1143 |
+
"bom-ref": "jxu124/llava_conversation_58k-7dcd95f0-d26a-5075-89f4-4afc13a5b93f",
|
1144 |
+
"name": "jxu124/llava_conversation_58k",
|
1145 |
+
"contents": {
|
1146 |
+
"url": "https://huggingface.co/datasets/jxu124/llava_conversation_58k"
|
1147 |
+
},
|
1148 |
+
"governance": {
|
1149 |
+
"owners": [
|
1150 |
+
{
|
1151 |
+
"organization": {
|
1152 |
+
"name": "jxu124",
|
1153 |
+
"url": "https://huggingface.co/jxu124"
|
1154 |
+
}
|
1155 |
+
}
|
1156 |
+
]
|
1157 |
+
},
|
1158 |
+
"description": "\n\t\n\t\t\n\t\tDataset Card for \"llava_conversation_58k\"\n\t\n\nMore Information needed\n"
|
1159 |
+
}
|
1160 |
+
]
|
1161 |
+
}
|
1162 |
+
]
|
1163 |
+
}
|