Last active
September 10, 2018 09:35
-
-
Save ricardoaat/09439f66d502c29f9ba51c2c286b2f02 to your computer and use it in GitHub Desktop.
Bioschemas dataset implementation example
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
{ | |
"@context": [ "http://schema.org", "http://bioschemas.org/specifications/"], | |
"@type": "Dataset", | |
"@id": "http://www.uniprot.org/uniparc", | |
"name": "UniProt Archive (UniParc)", | |
"description": "The UniProt Archive (UniParc) is a comprehensive and non-redundant database that contains most of the publicly available protein sequences in the world. Proteins may exist in different source databases and in multiple copies in the same database. UniParc avoided such redundancy by storing each unique sequence only once and giving it a stable and unique identifier (UPI) making it possible to identify the same protein from different source databases. A UPI is never removed, changed or reassigned. UniParc contains only protein sequences. All other information about the protein must be retrieved from the source databases using the database cross-references. UniParc tracks sequence changes in the source databases and archives the history of all changes. UniParc has combined many databases into one at the sequence level and searching UniParc is equivalent to searching many databases simultaneously", | |
"url": "http://www.uniprot.org/uniparc", | |
"identifier": "UniParc", | |
"keywords": "protein, protein sequence, archive", | |
"includedInDataCatalog": "http://www.uniprot.org", | |
"creator": { | |
"@type": "Organization", | |
"name": "UniProt Consortium" | |
}, | |
"version": "2017-09", | |
"license": "Creative Commons Attribution-NoDerivs", | |
"distribution": [{ | |
"@type": "DataDownload", | |
"name": "UniParc XML", | |
"fileFormat": "xml", | |
"contentURL": "ftp://ftp.uniprot.org/pub/databases/uniprot/current_release/uniparc/uniparc_all.xml.gz" | |
}, | |
{ | |
"@type": "DataDownload", | |
"name": "UniParc FASTA", | |
"fileFormat": "fasta", | |
"contentURL": "ftp://ftp.uniprot.org/pub/databases/uniprot/current_release/uniparc/uniparc_active.fasta.gz" | |
} | |
] | |
} | |
{ | |
"@context": ["http://schema.org/", "http://http://bioschemas.org/specifications/"], | |
"@type": "Dataset", | |
"datePublished": "2012-03-12", | |
"sourceOrganization": [{ | |
"@type": "Organization", | |
"name": "European Bioinformatics Institute EBI-EMBL" | |
}, { | |
"@type": "Organization", | |
"name": "Swiss Institute of Bioinformatics SIB" | |
}, { | |
"@type": "Organization", | |
"name": "Protein Information Resource PIR" | |
}], | |
"keywords": "PROTEOMICS, BIOLOGICAL SCIENCES, BIOCHEMISTRY AND CELL BIOLOGY, , MEDICAL AND HEALTH SCIENCES, MEDICAL BIOCHEMISTRY AND METABOLOMICS", | |
"inLanguage": "en", | |
"name": "UniProt Proteomes", | |
"description": "Set of proteins thought to be expressed by an organism. UniProt provides proteomes for species with completely sequenced genomes", | |
"identifier": "UniProt Proteomes", | |
"url": "https://www.uniprot.org/proteomes/" | |
} |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment