<entry xmlns="http://pdbe.org/empiar" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="https://ftp.ebi.ac.uk/pub/databases/emtest/empiar/schema/empiar.xsd" accessionCode="EMPIAR-11035" public="true">
    <admin>
        <currentStatus>REL</currentStatus>
        <keyDates>
            <depositionDate>2022-04-28</depositionDate>
            <releaseDate>2022-05-20</releaseDate>
            <updateDate>2022-05-20</updateDate>
        </keyDates>
        <title>CEM1.5M : a cellular EM dataset containing ~1.5 x 106 unlabeled 2D image patches curated for deep learning</title>
        <correspondingAuthor>
            <authorORCID>0000-0001-7982-6494</authorORCID>
            <firstName>Kedar</firstName>
            <lastName>Narayan</lastName>
            <organization type="academic">NCI/FNLCR</organization>
            <townOrCity>Frederick</townOrCity>
            <stateOrProvince>MD</stateOrProvince>
            <country>United States</country>
            <postOrZipCode>21701</postOrZipCode>
        </correspondingAuthor>
        <principalInvestigator>
            <authorORCID>0000-0001-7982-6494</authorORCID>
            <firstName>Kedar</firstName>
            <lastName>Narayan</lastName>
            <organization type="academic">NCI/FNLCR</organization>
            <townOrCity>Frederick</townOrCity>
            <stateOrProvince>MD</stateOrProvince>
            <country>United States</country>
            <postOrZipCode>21701</postOrZipCode>
        </principalInvestigator>
        <authorsList>
            <author authorORCID="0000-0001-7982-6494">Narayan K</author>
        </authorsList>
        <datasetSize>57.6</datasetSize>
        <entryDOI>10.6019/EMPIAR-11035</entryDOI>
        <experimentType>FIB-SEM</experimentType>
    </admin>
    <crossReferences>
        <citationList>
            <universalCitation>
                <journalCitation published="false" preprint="false">
                    <author authorORCID="0000-0001-7982-6494" order="1">Narayan K</author>
                    <title>Instance segmentation of mitochondria in electron microscopy images with a generalist deep learning model</title>
                    <journal></journal>
                    <journalAbbreviation></journalAbbreviation>
                    <country></country>
                </journalCitation>
            </universalCitation>
        </citationList>
        <relatedEmpiarEntries>
            <empiarEntry>EMPIAR-11037</empiarEntry>
        </relatedEmpiarEntries>
    </crossReferences>
    <imageSet>
        <name>1,592,753 unlabeled 2D cellular EM (CEM1.5M) image dataset curated for deep learning</name>
        <directory>/data</directory>
        <category>micrographs - single frame</category>
        <headerFormat>TIFF</headerFormat>
        <dataFormat>TIFF</dataFormat>
        <numImagesOrTiltSeries>1592753</numImagesOrTiltSeries>
        <framesPerImage>1</framesPerImage>
        <voxelType>UNSIGNED BYTE</voxelType>
        <dimensions>
            <imageWidth>224</imageWidth>
            <pixelWidth>variable</pixelWidth>
            <imageHeight>224</imageHeight>
            <pixelHeight>variable</pixelHeight>
        </dimensions>
        <details>This zip file contains 1,592,753 heterogeneous, information-rich, non-redundant unlabeled 2D cellular EM (hence CEM1.5M) images, divided into 651 subdirectories (each directory being a unique vEM or EM image set). The image patches are mostly 224 x 224 pixels, however some are 512 x 512, and some are smaller. The raw image data was curated for deep learning largely following Conrad and Narayan, eLife 2021. https://elifesciences.org/articles/65894</details>
        <segmentationList/>
        <micrographsFilePattern></micrographsFilePattern>
        <pickedParticlesFilePattern></pickedParticlesFilePattern>
        <pickedParticlesDirectory></pickedParticlesDirectory>
    </imageSet>
</entry>
