1. Select all taxa from the UniProt taxonomy

    # List every resource typed up:Taxon, reading only from the taxonomy named graph.
    # NOTE(review): the up: prefix is not declared here - presumably predefined
    # by the endpoint; confirm before running elsewhere.
    SELECT ?taxon
    FROM <http://sparql.uniprot.org/taxonomy>
    WHERE {
      ?taxon a up:Taxon .
    }
  2. Select all bacterial taxa and their scientific name from the UniProt taxonomy

    # Taxa that are a subclass of taxon:2, together with their scientific name.
    SELECT ?taxon ?name
    WHERE {
      ?taxon a up:Taxon ;
             up:scientificName ?name ;
             rdfs:subClassOf taxon:2 .
    }
  3. Select all UniProt entries, and their organism and amino acid sequences (including isoforms), for _E. coli K12_ and all its strains

    # Proteins whose organism is taxon:83333 or any (transitive) subclass of it,
    # with every sequence resource attached to the protein and its value.
    SELECT ?protein ?organism ?isoform ?aa_sequence
    WHERE {
      ?protein a up:Protein ;
               up:organism ?organism .
      # The * makes the path reflexive-transitive, so taxon:83333 itself matches too.
      ?organism rdfs:subClassOf* taxon:83333 .
      ?protein up:sequence ?isoform .
      ?isoform rdf:value ?aa_sequence .
    }
  4. Select the UniProt entry with the mnemonic 'A4_HUMAN'

    # Look up the protein whose mnemonic is exactly 'A4_HUMAN'.
    SELECT ?protein
    WHERE {
      ?protein a up:Protein ;
               up:mnemonic 'A4_HUMAN' .
    }
  5. Select all UniProt entries that are classified with the keyword 'Acetoin biosynthesis (KW-0005)', together with their cross-references to the PDB database

    # Proteins classified with keywords:5 and each of their rdfs:seeAlso
    # cross-references whose database is PDB.
    SELECT ?protein ?db
    WHERE {
      ?protein a up:Protein ;
               up:classifiedWith keywords:5 ;
               rdfs:seeAlso ?db .
      ?db up:database <http://purl.uniprot.org/database/PDB> .
    }
  6. Select all cross-references to external databases of the category '3D structure databases' of UniProt entries that are classified with the keyword 'Acetoin biosynthesis (KW-0005)'

    # Distinct cross-references of proteins classified with keywords:5 where the
    # referenced database has the category '3D structure databases'.
    SELECT DISTINCT ?link
    WHERE {
      ?protein a up:Protein ;
               up:classifiedWith keywords:5 ;
               rdfs:seeAlso ?link .
      ?link up:database ?db .
      ?db up:category '3D structure databases' .
    }
  7. Select all UniProt entries, and their recommended protein name, that have a preferred gene name that contains the text 'DNA'

    # Proteins and their recommended full name, restricted to proteins encoded
    # by a gene whose preferred label contains the substring 'DNA'.
    SELECT ?protein ?name
    WHERE {
      ?protein a up:Protein ;
               up:recommendedName ?recommended ;
               up:encodedBy ?gene .
      ?recommended up:fullName ?name .
      ?gene skos:prefLabel ?text .
      # CONTAINS is a case-sensitive substring match.
      FILTER (CONTAINS(?text, 'DNA'))
    }
  8. Select the preferred gene name and disease annotation of all human UniProt entries that are known to be involved in a disease

    # Preferred gene name and disease-annotation comment for every protein of
    # organism taxon:9606 that carries a up:Disease_Annotation.
    SELECT ?name ?text
    WHERE {
      ?protein a up:Protein ;
               up:organism taxon:9606 ;
               up:encodedBy ?gene ;
               up:annotation ?annotation .
      ?gene skos:prefLabel ?name .
      ?annotation a up:Disease_Annotation ;
                  rdfs:comment ?text .
    }
  9. Select all human UniProt entries with a sequence variant that leads to a 'loss of function'

    # Proteins of organism taxon:9606 with a natural-variant annotation whose
    # comment contains the phrase 'loss of function'.
    SELECT ?protein ?text
    WHERE {
      ?protein a up:Protein ;
               up:organism taxon:9606 ;
               up:annotation ?annotation .
      ?annotation a up:Natural_Variant_Annotation ;
                  rdfs:comment ?text .
      # Case-sensitive substring match on the annotation comment.
      FILTER (CONTAINS(?text, 'loss of function'))
    }
  10. Select all UniProt entries with annotated transmembrane regions and the regions' begin and end coordinates on the canonical sequence

    # Proteins with a transmembrane annotation, plus the begin and end position
    # of each annotated range.
    SELECT ?protein ?begin ?end
    WHERE {
      ?protein a up:Protein ;
               up:annotation ?annotation .
      ?annotation a up:Transmembrane_Annotation ;
                  up:range ?range .
      # Property paths hop through the intermediate begin/end nodes to the position.
      ?range faldo:begin/faldo:position ?begin ;
             faldo:end/faldo:position ?end .
    }
  11. Select all UniProt entries that were integrated on the 30th of November 2010

    # Proteins whose up:created value is the xsd:date 2010-11-30.
    SELECT ?protein
    WHERE {
      ?protein a up:Protein ;
               up:created '2010-11-30'^^xsd:date .
    }
  12. Was any UniProt entry integrated on the 9th of January 2013?

    # Yes/no: does at least one protein have up:created equal to 2013-01-09?
    ASK
    WHERE {
      ?protein a up:Protein ;
               up:created '2013-01-09'^^xsd:date .
    }
  13. Construct new triples of the type 'HumanProtein' from all human UniProt entries

    # Build one "?protein a up:HumanProtein" triple for every protein whose
    # organism is taxon:9606.
    CONSTRUCT {
      ?protein a up:HumanProtein .
    }
    WHERE {
      ?protein a up:Protein ;
               up:organism taxon:9606 .
    }
  14. Select all triples that relate to the EMBL CDS entry AAO89367.1

    # Return the endpoint's description of the EMBL CDS resource AAO89367.1.
    DESCRIBE <http://purl.uniprot.org/embl-cds/AAO89367.1>
  15. Select all triples that relate to the taxon that describes Homo sapiens in the named graph for taxonomy

    # Describe taxon:9606 using only the taxonomy named graph as the dataset.
    DESCRIBE taxon:9606
    FROM <http://sparql.uniprot.org/taxonomy>
  16. Select the average number of cross-references to the PDB database of UniProt entries that have at least one cross-reference to the PDB database

    # Average number of distinct PDB cross-references per protein, taken over
    # the proteins that have at least one such cross-reference.
    SELECT (AVG(?linksToPdbPerEntry) AS ?avgLinksToPdbPerEntry)
    WHERE {
      # Sub-select: one row per protein with its count of distinct PDB links.
      SELECT ?protein (COUNT(DISTINCT ?db) AS ?linksToPdbPerEntry)
      WHERE {
        ?protein a up:Protein ;
                 rdfs:seeAlso ?db .
        # The IRI must use literal angle brackets; HTML entities are not valid SPARQL.
        ?db up:database <http://purl.uniprot.org/database/PDB> .
      }
      GROUP BY ?protein
      ORDER BY DESC(?linksToPdbPerEntry)
    }
  17. Select the number of UniProt entries for each of the EC (Enzyme Commission) second level categories

    # Count proteins per enzyme class, keeping only enzyme classes that are a
    # direct rdfs:subClassOf one of the seven top-level EC classes listed below.
    SELECT ?enzyme (COUNT(?protein) AS ?size)
    WHERE {
      VALUES (?ecClass) {
        (ec:1.-.-.-)
        (ec:2.-.-.-)
        (ec:3.-.-.-)
        (ec:4.-.-.-)
        (ec:5.-.-.-)
        (ec:6.-.-.-)
        (ec:7.-.-.-)
      }
      ?protein up:enzyme ?enzyme .
      ?enzyme rdfs:subClassOf ?ecClass .
    }
    GROUP BY ?enzyme
    ORDER BY ?enzyme
  18. Find all Natural Variant Annotations that are associated, via an evidence tag, with an article that has a PubMed identifier

    # Natural-variant annotations that are the rdf:object of a reified statement
    # whose attribution has a journal citation as its source. The three output
    # columns are identifiers cut out of the IRIs with SUBSTR.
    SELECT ?accession ?annotation_acc ?pubmed
    WHERE {
      ?protein a up:Protein ;
               up:annotation ?annotation .
      ?annotation a up:Natural_Variant_Annotation .
      ?linkToEvidence rdf:object ?annotation ;
                      up:attribution ?attribution .
      ?attribution up:source ?source .
      ?source a up:Journal_Citation .
      # Offset 33 skips the 32-character prefix "http://purl.uniprot.org/uniprot/".
      BIND (SUBSTR(STR(?protein), 33) AS ?accession)
      # Annotation IRIs containing "#SIP" are cut at 33, all others at 36.
      # NOTE(review): presumably "#SIP" IRIs hang off the protein IRI while the
      # rest live under a longer annotation namespace - confirm against the data.
      BIND (IF(CONTAINS(STR(?annotation), "#SIP"),
               SUBSTR(STR(?annotation), 33),
               SUBSTR(STR(?annotation), 36)) AS ?annotation_acc)
      # NOTE(review): offset 35 assumes a 34-character citation IRI prefix - confirm.
      BIND (SUBSTR(STR(?source), 35) AS ?pubmed)
    }
  19. Find how often an article in pubmed was used in an evidence tag (ordered by most used to least)

    # For each journal citation, count how many attributions name it as their
    # source, most-used citation first.
    # The count column is spelled ?attributions (previously misspelt ?attribitions).
    SELECT ?source (COUNT(?attribution) AS ?attributions)
    WHERE {
      ?protein a up:Protein ;
               up:annotation ?annotation .
      ?linkToEvidence rdf:object ?annotation ;
                      up:attribution ?attribution .
      ?attribution up:source ?source .
      ?source a up:Journal_Citation .
    }
    GROUP BY ?source
    ORDER BY DESC(COUNT(?attribution))
  20. Find where disease related proteins are known to be located in the cell

    # Pair every disease label of a protein with every cellular-component label
    # reachable from the same protein's annotations.
    SELECT ?protein ?disease ?location_inside_cell ?cellcmpt
    WHERE {
      # Two annotations on the same protein: one is matched as a disease
      # annotation, the other as a subcellular-location annotation.
      ?protein up:annotation ?diseaseAnnotation ,
                             ?subcellAnnotation .
      ?diseaseAnnotation up:disease/skos:prefLabel ?disease .
      ?subcellAnnotation up:locatedIn/up:cellularComponent ?cellcmpt .
      ?cellcmpt skos:prefLabel ?location_inside_cell .
    }
  21. For two accessions, find the GO term labels and group them into GO process, function and component

    # For the two accessions in VALUES, collect the labels of the terms each
    # protein is classified with into three ';'-separated lists, one per GO root.
    # Every '#' comment sits on its own line: a SPARQL comment runs to the end of
    # the line, so inline comments in a one-line query would swallow the rest.
    SELECT
      (CONCAT(SUBSTR(STR(?protein), 33)) AS ?uniprot)
      (GROUP_CONCAT(?celtype; separator=";") AS ?celtypes)
      (GROUP_CONCAT(?biotype; separator=";") AS ?biotypes)
      (GROUP_CONCAT(?moltype; separator=";") AS ?moltypes)
    WHERE {
      VALUES (?ac) { ("Q6GZX4") ("Q96375") }
      # Build the protein IRI from the accession string.
      BIND (IRI(CONCAT("http://purl.uniprot.org/uniprot/", ?ac)) AS ?protein)
      ?protein a up:Protein ;
               up:classifiedWith ?goTerm .
      # Determine if the type is biological_process
      OPTIONAL {
        ?goTerm rdfs:subClassOf <http://purl.obolibrary.org/obo/GO_0008150> .
        ?goTerm rdfs:label ?biotype .
      }
      # Determine if the type is cellular_component
      OPTIONAL {
        ?goTerm rdfs:subClassOf <http://purl.obolibrary.org/obo/GO_0005575> .
        ?goTerm rdfs:label ?celtype .
      }
      # Determine if the type is molecular_function
      OPTIONAL {
        ?goTerm rdfs:subClassOf <http://purl.obolibrary.org/obo/GO_0003674> .
        ?goTerm rdfs:label ?moltype .
      }
      # Filter out the uniprot keywords
      FILTER (bound(?biotype) || bound(?celtype) || bound(?moltype))
    }
    GROUP BY ?protein
  22. Number of reviewed (Swiss-Prot) human entries that are related to kinase activity

    # Count distinct reviewed proteins of organism taxon:9606 that are classified
    # with GO:0016301 directly or with a term that is a subclass of it.
    SELECT (COUNT(DISTINCT ?protein) AS ?pc)
    WHERE {
      ?protein rdf:type up:Protein ;
               up:reviewed true ;
               up:organism taxon:9606 ;
               # Alternation: direct classification, or one rdfs:subClassOf hop away.
               up:classifiedWith|(up:classifiedWith/rdfs:subClassOf) GO:0016301 .
    }
  23. Find the release number of the uniprot data that is currently being queried

    # Read every pav:version value found in the endpoint's VoID description graph.
    SELECT ?version
    FROM <http://sparql.uniprot.org/.well-known/void>
    WHERE {
      [] <http://purl.org/pav/2.0/version> ?version .
    }
  24. Find any uniprot entry which has a name 'HLA class I histocompatibility antigen, B-73 alpha chain'

    # Proteins whose recommended or alternative structured name has the given
    # literal under any property that is a sub-property of up:structuredNameType.
    SELECT ?protein ?anyKindOfName
    WHERE {
      ?protein a up:Protein ;
               (up:recommendedName|up:alternativeName) ?structuredName .
      ?structuredName ?anyKindOfName "HLA class I histocompatibility antigen, B-73 alpha chain" .
      ?anyKindOfName rdfs:subPropertyOf up:structuredNameType .
    }
  25. Find any UniProt entry, or any domain or component of a UniProt entry, which has the name 'HLA class I histocompatibility antigen, B-73 alpha chain'

    # Like a plain name lookup, but the structured name may belong to the protein
    # itself or to one of its up:domain / up:component parts.
    SELECT ?protein ?anyKindOfName
    WHERE {
      ?protein a up:Protein ;
               (up:recommendedName|up:alternativeName)
               |((up:domain|up:component)/(up:recommendedName|up:alternativeName))
                 ?structuredName .
      ?structuredName ?anyKindOfName "HLA class I histocompatibility antigen, B-73 alpha chain" .
      ?anyKindOfName rdfs:subPropertyOf up:structuredNameType .
    }