82_rhea_reactions_associated_with_ec_in_uniprotkb: List Rhea reactions associated with an EC (enzyme classification).

 
1
PREFIX up: <http://purl.uniprot.org/core/>
2
SELECT 
3
  ?rhea 
4
  ?EC 
5
WHERE {
6
  ?CatalyticActivity  up:catalyzedReaction   ?rhea ;
7
    up:enzymeClass         ?EC .
8
}
Use

83_rhea_reactions_not_associated_with_ec_in_uniprotkb: List Rhea reactions that are not associated with an EC (enzyme classification).

xxxxxxxxxx
10
 
1
PREFIX up: <http://purl.uniprot.org/core/>
2
SELECT 
3
  ?rhea 
4
  ?EC 
5
WHERE {
6
  ?CatalyticActivity up:catalyzedReaction ?rhea .
7
  MINUS {
8
    ?CatalyticActivity up:enzymeClass ?EC .
9
  }
10
}
Use

84_taxonomy_hierarchy: Find all taxonomic records that describe species of the genus Homo.

xxxxxxxxxx
14
 
1
PREFIX rdfs: <http://www.w3.org/2000/01/rdf-schema#>
2
PREFIX taxon: <http://purl.uniprot.org/taxonomy/>
3
PREFIX up: <http://purl.uniprot.org/core/>
4
SELECT 
5
  ?species 
6
  ?genus 
7
WHERE {
8
  BIND(taxon:9605 AS ?genus)
9
  ?species a up:Taxon ;
10
           up:rank up:Species ;
11
           rdfs:subClassOf ?genus .
12
  ?genus a up:Taxon ;
13
         up:rank up:Genus .
14
}
Use

85_taxonomy_host: Find taxon records that are known to have part of their life cycle in other organisms (e.g. parasite, symbiont, infection)

xxxxxxxxxx
7
 
1
PREFIX up: <http://purl.uniprot.org/core/>
2
SELECT 
3
  ?virus 
4
  ?host 
5
WHERE {
6
    ?virus up:host ?host .
7
}
Use

86_taxonomy_rank_and_scientific_name: Retrieve the rank and the scientific name of an taxonomic record. Not all taxonomic records have a rank associated with them.

xxxxxxxxxx
12
 
1
PREFIX up: <http://purl.uniprot.org/core/>
2
SELECT
3
  ?taxon 
4
  ?scientificName
5
  ?rank
6
WHERE {
7
  ?taxon a up:Taxon ;
8
         up:scientificName ?scientificName .
9
  OPTIONAL {
10
    ?taxon up:rank ?rank
11
  }
12
}
Use

87_taxonomy_with_at_least_one_swissprot: Find taxon records for which one reviewed UniProtKB/Swiss-Prot entry exists. We might expect species, strains, subspecies and isolates in the taxon list.

xxxxxxxxxx
23
 
1
PREFIX rdfs: <http://www.w3.org/2000/01/rdf-schema#>
2
PREFIX taxon: <http://purl.uniprot.org/taxonomy/>
3
PREFIX up: <http://purl.uniprot.org/core/>
4
SELECT
5
    DISTINCT
6
         ?taxid
7
         ?scientificName
8
         ?domain
9
         ?domainName
10
WHERE {
11
  ?uniprot a up:Protein .
12
  # reviewed entries
13
  ?uniprot up:reviewed true .
14
  ?uniprot up:organism ?taxid . 
15
  ?taxid up:scientificName ?scientificName .
16
    
17
  VALUES ?domain { taxon:2 # bacteria
18
                   taxon:2157 # archaea
19
                   taxon:2759 # eukaryota
20
                   taxon:10239 #viruses
21
                 } .
22
  ?taxid rdfs:subClassOf ?domain .
23
}
Use

88_uniparc_linked_to_active_uniprot: Show for a given UniParc accessions which active UniProtKB entries have the same amino acid sequence

xxxxxxxxxx
13
 
1
PREFIX up: <http://purl.uniprot.org/core/>
2
SELECT 
3
  ?uniparc
4
  ?uniprot
5
WHERE {
6
  GRAPH <http://sparql.uniprot.org/uniparc>{
7
    BIND(<http://purl.uniprot.org/uniparc/UPI000002DB1C> AS ?uniparc) 
8
    ?uniparc up:sequenceFor ?uniprot .
9
  }
10
  GRAPH <http://sparql.uniprot.org/uniprot> {
11
    ?uniprot a up:Protein .
12
  }
13
}
Use

89_uniparc_triples_directly_associated: Predicates and objects, for a given UniParc accession as a subject

xxxxxxxxxx
7
 
1
PREFIX up: <http://purl.uniprot.org/core/>
2
SELECT 
3
  ?predicate 
4
  ?object 
5
WHERE { 
6
  <http://purl.uniprot.org/uniparc/UPI000012A0AD> ?predicate ?object
7
}
Use

90_uniprot_affected_by_metabolic_diseases_using_MeSH: Proteins involved in metabolic diseases in UniProtKB. Using the MeSH concept as a root to find metabolic diseases in UniProt.

xxxxxxxxxx
21
 
1
PREFIX rdfs: <http://www.w3.org/2000/01/rdf-schema#>
2
PREFIX up: <http://purl.uniprot.org/core/>
3
SELECT
4
 ?disease ?protein
5
WHERE {
6
  SERVICE<https://id.nlm.nih.gov/mesh/sparql> {
7
    GRAPH <http://id.nlm.nih.gov/mesh> {
8
      # Mesh M0013493 is a meaningless gathering about the concept 'Metabolic Diseases'
9
      ?mesh <http://id.nlm.nih.gov/mesh/vocab#broaderDescriptor>* ?broader .
10
      ?broader <http://id.nlm.nih.gov/mesh/vocab#preferredConcept> <http://id.nlm.nih.gov/mesh/M0013493> .
11
    }
12
  }
13
  GRAPH <http://sparql.uniprot.org/diseases>{
14
    ?disease a up:Disease ;
15
        rdfs:seeAlso ?mesh .
16
    ?mesh up:database <http://purl.uniprot.org/database/MeSH> .
17
  }
18
  GRAPH <http://sparql.uniprot.org/uniprot> {
19
     ?protein up:annotation/up:disease ?disease . 
20
  }
21
}
Use

91_uniprot_alternative_protein_full_name: Alternative protein full names for UniProtKB entries

xxxxxxxxxx
8
 
1
PREFIX up: <http://purl.uniprot.org/core/>
2
SELECT ?protein 
3
  ?fullName
4
WHERE {
5
  ?protein a up:Protein ;
6
           up:alternativeName ?recommendedName .
7
  ?recommendedName up:fullName ?fullName .
8
}
Use

92_uniprot_bioregistry_iri_translation: Translate the global unique identifier for a UniProtKB record into other options using the bioregistry translating endpoint.

xxxxxxxxxx
13
 
1
PREFIX owl: <http://www.w3.org/2002/07/owl#>
2
PREFIX uniprotkb: <http://purl.uniprot.org/uniprot/>
3
PREFIX up: <http://purl.uniprot.org/core/>
4
SELECT 
5
    ?protein 
6
    ?otherIdentifier
7
WHERE {
8
    BIND(uniprotkb:P00750 AS ?protein)
9
    ?protein a up:Protein .
10
    SERVICE <https://bioregistry.io/sparql> {
11
        ?protein owl:sameAs ?otherIdentifier .
12
    }
13
}
Use

93_uniprot_created_modified_updated: List the created, last modified, and last sequence update dates for UniProtKB proteins.

xxxxxxxxxx
12
 
1
PREFIX up: <http://purl.uniprot.org/core/>
2
SELECT
3
  ?protein 
4
  ?created
5
  ?modified
6
  ?version
7
WHERE {
8
  ?protein a up:Protein ;
9
           up:created ?created ;
10
           up:modified ?modified ;
11
           up:version ?version .
12
}
Use

94_uniprot_encoding_gene: List UniProtKB proteins with their associated named gene

xxxxxxxxxx
7
 
1
PREFIX up: <http://purl.uniprot.org/core/>
2
SELECT ?protein
3
  ?gene 
4
WHERE {
5
  ?protein a up:Protein ;
6
           up:encodedBy ?gene .
7
}
Use

96_uniprot_encoding_gene_name: List UniProtKB proteins with their associated gene and the gene's preffered name

xxxxxxxxxx
9
 
1
PREFIX skos: <http://www.w3.org/2004/02/skos/core#>
2
PREFIX up: <http://purl.uniprot.org/core/>
3
SELECT ?protein
4
  ?gene 
5
WHERE {
6
  ?protein a up:Protein ;
7
           up:encodedBy ?gene .
8
  ?gene skos:prefLabel ?recommendedGeneName .
9
}
Use

97_uniprot_encoding_gene_org_name: List UniProtKB proteins with their associated gene and the gene's ORF label

xxxxxxxxxx
9
 
1
PREFIX up: <http://purl.uniprot.org/core/>
2
SELECT
3
  ?gene 
4
  ?orfName
5
WHERE {
6
  ?protein a up:Protein ;
7
           up:encodedBy ?gene .
8
  ?gene up:orfName ?orfName .
9
}
Use

98_uniprot_entries_with_more_than_two_geneid_crossrefences: Find GeneID's crosslinked to more than one human or mouse UniProtKB entry

xxxxxxxxxx
14
 
1
PREFIX rdfs: <http://www.w3.org/2000/01/rdf-schema#>
2
PREFIX up: <http://purl.uniprot.org/core/>
3
PREFIX taxon:<http://purl.uniprot.org/taxon/>
4
SELECT 
5
  ?geneid 
6
  ?organism 
7
  (GROUP_CONCAT(?protein; separator=', ') AS ?entries)
8
WHERE
9
{
10
  VALUES ?organism {taxon:9606 taxon:10090}
11
  ?geneid up:database <http://purl.uniprot.org/database/GeneID> .
12
  ?protein rdfs:seeAlso ?geneid ; 
13
           up:organism ?organism
14
} GROUP BY ?geneid ?organism HAVING (COUNT(?protein) > 1) ORDER BY ?organism ?geneid
Use

99_uniprot_identifiers_org_translation: Translate a selection of UniProtKB accession numbers into other options using the identifiers.org translating endpoint.

xxxxxxxxxx
13
 
1
PREFIX owl: <http://www.w3.org/2002/07/owl#>
2
PREFIX uniprotkb: <http://purl.uniprot.org/uniprot/>
3
PREFIX up: <http://purl.uniprot.org/core/>
4
SELECT 
5
    ?protein 
6
    ?otherIdentifier
7
WHERE {
8
    VALUES (?protein) {(uniprotkb:P00750) (uniprotkb:P05067)}
9
    ?protein a up:Protein .
10
    SERVICE <https://sparql.api.identifiers.org/sparql> {
11
        ?protein owl:sameAs ?otherIdentifier .
12
    }
13
}
Use

drosophila_enzymes_derived_from_at_least_two_mRNAs: Find Drosophila proteins, that depend on more than one transcript (requires cross-references to Ensembl family of resources).

xxxxxxxxxx
12
 
1
PREFIX rdfs: <http://www.w3.org/2000/01/rdf-schema#>
2
PREFIX taxon: <http://purl.uniprot.org/taxonomy/>
3
PREFIX up: <http://purl.uniprot.org/core/>
4
SELECT
5
  ?protein
6
WHERE {
7
  ?protein up:organism taxon:7227 ;
8
    a up:Protein ;
9
    up:reviewed true ;
10
    rdfs:seeAlso ?transcript .
11
  ?transcript  a up:Transcript_Resource .
12
} GROUP BY ?protein HAVING(COUNT(?transcript) >= 2)
Use

drosophila_proteins_derived_from_at_least_two_mRNAs: Find Drosophila enzymes, that depend on more than one transcript (requires cross-references to Ensembl family of resources).

xxxxxxxxxx
17
 
1
PREFIX rdfs: <http://www.w3.org/2000/01/rdf-schema#>
2
PREFIX taxon: <http://purl.uniprot.org/taxonomy/>
3
PREFIX up: <http://purl.uniprot.org/core/>
4
SELECT
5
  ?protein
6
WHERE {
7
  ?protein up:organism taxon:7227 ;
8
    a up:Protein ;
9
    up:reviewed true ;
10
    rdfs:seeAlso ?transcript .
11
  {
12
    ?protein up:annotation/a up:Catalytic_Activity_Annotation ;
13
  } UNION {
14
    ?protein up:enzyme ?enzyme .
15
  }
16
  ?transcript  a up:Transcript_Resource .
17
} GROUP BY ?protein HAVING(COUNT(?transcript) >= 2)
Use

enzyme_with_threonine_as_active_site: Find enzymes with a Tyrosine (Y) as an active site

xxxxxxxxxx
15
 
1
PREFIX faldo: <http://biohackathon.org/resource/faldo#>
2
PREFIX rdf: <http://www.w3.org/1999/02/22-rdf-syntax-ns#>
3
PREFIX up: <http://purl.uniprot.org/core/>
4
SELECT
5
  ?protein
6
WHERE {
7
  ?protein up:annotation ?activeSiteAnnotation .
8
  ?activeSiteAnnotation a up:Active_Site_Annotation ;
9
    up:range ?range .
10
  ?range faldo:begin ?begin .
11
  ?begin faldo:position ?beginPosition ;
12
    faldo:reference ?sequence .
13
  ?sequence rdf:value ?sequenceVal .
14
  FILTER(SUBSTR(?sequenceVal, ?beginPosition, 1) = 'Y')
15
}
Use

uniprot_encoding_gene_name_alternative_name: List UniProtKB proteins with their associated gene and the gene's names that are used in the field, but not recommended for use by UniProtKB

xxxxxxxxxx
9
 
1
PREFIX skos: <http://www.w3.org/2004/02/skos/core#>
2
PREFIX up: <http://purl.uniprot.org/core/>
3
SELECT ?protein
4
  ?gene ?altGeneName
5
WHERE {
6
  ?protein a up:Protein ;
7
           up:encodedBy ?gene .
8
  ?gene skos:altLabel ?altGeneName .
9
}
Use