{ "cells": [ { "metadata": {}, "cell_type": "markdown", "source": [ "# GO Annotation Analysis\n", "\n", "Analyzes the associations between genes and GO terms in the Gene Ontology (GO) database.\n", "\n", "In particular, categorizes associations based on:\n", "\n", "- whether they have been \"retracted\" (i.e., removed from the database)\n", "- whether they have been reviewed and accepted or rejected via IBA" ], "id": "e82528c7acc91898" }, { "metadata": { "collapsed": true, "ExecuteTime": { "end_time": "2025-01-16T01:01:52.125658Z", "start_time": "2025-01-16T01:01:52.121736Z" } }, "cell_type": "code", "source": [ "import pandas as pd\n", "\n", "from tests.test_implementations.test_robot_template import adapter\n", "\n", "# a recent release plus an older one that may have retracted entries\n", "\n", "RELEASES = [\n", " \"2024-11-03\",\n", " \"2024-06-10\",\n", " \"2020-01-01\",\n", "]\n", "\n", "LATEST = RELEASES[0]\n", "PREVIOUS = RELEASES[1:]\n", "assert all(r < LATEST for r in PREVIOUS)" ], "id": "initial_id", "outputs": [], "execution_count": 1 }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T01:01:52.132069Z", "start_time": "2025-01-16T01:01:52.129698Z" } }, "cell_type": "code", "source": "NEW_CUTOFF = \"2024-06-01\"", "id": "49978ca9b485fbb2", "outputs": [], "execution_count": 2 }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T01:01:52.281969Z", "start_time": "2025-01-16T01:01:52.279065Z" } }, "cell_type": "code", "source": [ "# taxa to analyze\n", "\n", "TAXA = [\n", " (\"human\", \"goa_human\", 9606),\n", " (\"Arabidopsis thaliana\", \"tair\", 3702),\n", " (\"yeast\", \"sgd\", 559292),\n", "]" ], "id": "6018e587719b9375", "outputs": [], "execution_count": 3 }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T01:01:52.292074Z", "start_time": "2025-01-16T01:01:52.289520Z" } }, "cell_type": "code", "source": "GAF_URL_TEMPLATE = \"https://release.geneontology.org/{date}/annotations/{name}.gaf.gz\"", "id": "7308ce91009184f6", 
"outputs": [], "execution_count": 4 }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T01:01:54.402787Z", "start_time": "2025-01-16T01:01:52.338558Z" } }, "cell_type": "code", "source": "from oaklib.datamodels.vocabulary import IS_A, PART_OF", "id": "e5d71d36e84b2d23", "outputs": [], "execution_count": 5 }, { "metadata": {}, "cell_type": "markdown", "source": "## Create an OAK adapter for the GO ontology", "id": "aa0baac1347bdbad" }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T01:02:10.701075Z", "start_time": "2025-01-16T01:01:54.406977Z" } }, "cell_type": "code", "source": [ "from oaklib import get_adapter\n", "\n", "go = get_adapter(\"sqlite:obo:go\")" ], "id": "5ec745bd2131923d", "outputs": [ { "data": { "text/plain": [ "Downloading go.db.gz: 0.00B [00:00, ?B/s]" ], "application/vnd.jupyter.widget-view+json": { "version_major": 2, "version_minor": 0, "model_id": "aaf16a6ab071468590f8ec5a8690270e" } }, "metadata": {}, "output_type": "display_data" } ], "execution_count": 6 }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T01:02:11.205688Z", "start_time": "2025-01-16T01:02:10.709344Z" } }, "cell_type": "code", "source": "obsoletes = set(go.obsoletes())", "id": "2639655a1230be36", "outputs": [], "execution_count": 7 }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T01:02:11.219520Z", "start_time": "2025-01-16T01:02:11.217763Z" } }, "cell_type": "code", "source": "", "id": "323074c9573b3799", "outputs": [], "execution_count": null }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T01:02:12.966565Z", "start_time": "2025-01-16T01:02:11.231132Z" } }, "cell_type": "code", "source": "binding_terms = set(go.descendants(\"GO:0005488\", predicates=[IS_A]))", "id": "a75d36046527380e", "outputs": [], "execution_count": 8 }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T01:02:13.187408Z", "start_time": "2025-01-16T01:02:12.977295Z" } }, "cell_type": "code", "source": [ "antislim_terms = 
def get_gaf(release, name):
    """
    Download one gzipped GAF file from the GO release archive and parse it.

    Relies on the notebook-level ``session`` (cached HTTP session),
    ``gaf_parser`` and ``GAF_URL_TEMPLATE``.

    :param release: release date, substituted for ``{date}`` in ``GAF_URL_TEMPLATE``
    :param name: GAF file stem, substituted for ``{name}`` (e.g. ``"goa_human"``)
    :return: list of everything yielded by ``gaf_parser.parse``; negated
        associations are kept (``preserve_negated_associations=True``)
    :raises: whatever ``response.raise_for_status()`` raises for an HTTP error
        status, and ``gzip.BadGzipFile`` if the payload is not gzip data
    """
    config = ParserConfiguration(preserve_negated_associations=True)
    url = GAF_URL_TEMPLATE.format(date=release, name=name)
    with session.get(url, stream=True) as response:
        # Fail with the HTTP status (e.g. a release/name that does not exist)
        # instead of feeding an error page to gzip and getting BadGzipFile.
        response.raise_for_status()
        decompressed = gzip.decompress(response.content)
    print(f"Reading {url} using {config}")
    # Decode explicitly as UTF-8 rather than with the platform's locale
    # encoding, so parsing does not depend on the machine running the notebook.
    with io.TextIOWrapper(io.BytesIO(decompressed), encoding="utf-8") as text_stream:
        # Materialise inside the `with`: the parser reads the stream lazily.
        return list(gaf_parser.parse(text_stream, configuration=config))
https://release.geneontology.org/2024-11-03/annotations/tair.gaf.gz using ParserConfiguration(preserve_negated_associations=True, include_association_attributes=None, primary_knowledge_source=None, aggregator_knowledge_source=None)\n", "Loaded 235371 associations\n", " 1374 negated associations\n", "Loading 2024-11-03 yeast\n", "Reading https://release.geneontology.org/2024-11-03/annotations/sgd.gaf.gz using ParserConfiguration(preserve_negated_associations=True, include_association_attributes=None, primary_knowledge_source=None, aggregator_knowledge_source=None)\n", "Loaded 120823 associations\n", " 6 negated associations\n", "Loading 2024-06-10 human\n", "Reading https://release.geneontology.org/2024-06-10/annotations/goa_human.gaf.gz using ParserConfiguration(preserve_negated_associations=True, include_association_attributes=None, primary_knowledge_source=None, aggregator_knowledge_source=None)\n", "Loaded 707168 associations\n", " 1308 negated associations\n", "Loading 2024-06-10 Arabidopsis thaliana\n", "Reading https://release.geneontology.org/2024-06-10/annotations/tair.gaf.gz using ParserConfiguration(preserve_negated_associations=True, include_association_attributes=None, primary_knowledge_source=None, aggregator_knowledge_source=None)\n", "Loaded 235504 associations\n", " 1373 negated associations\n", "Loading 2024-06-10 yeast\n", "Reading https://release.geneontology.org/2024-06-10/annotations/sgd.gaf.gz using ParserConfiguration(preserve_negated_associations=True, include_association_attributes=None, primary_knowledge_source=None, aggregator_knowledge_source=None)\n", "Loaded 117290 associations\n", " 7 negated associations\n", "Loading 2020-01-01 human\n", "Reading https://release.geneontology.org/2020-01-01/annotations/goa_human.gaf.gz using ParserConfiguration(preserve_negated_associations=True, include_association_attributes=None, primary_knowledge_source=None, aggregator_knowledge_source=None)\n", "Loaded 495361 associations\n", " 1244 negated 
associations\n", "Loading 2020-01-01 Arabidopsis thaliana\n", "Reading https://release.geneontology.org/2020-01-01/annotations/tair.gaf.gz using ParserConfiguration(preserve_negated_associations=True, include_association_attributes=None, primary_knowledge_source=None, aggregator_knowledge_source=None)\n", "Loaded 236821 associations\n", " 1364 negated associations\n", "Loading 2020-01-01 yeast\n", "Reading https://release.geneontology.org/2020-01-01/annotations/sgd.gaf.gz using ParserConfiguration(preserve_negated_associations=True, include_association_attributes=None, primary_knowledge_source=None, aggregator_knowledge_source=None)\n", "Loaded 120916 associations\n", " 28 negated associations\n" ] } ], "execution_count": 13 }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T01:05:31.064502Z", "start_time": "2025-01-16T01:05:31.055034Z" } }, "cell_type": "code", "source": "db[\"goa_human\"][LATEST][0]", "id": "69f2c5dd1f8ff101", "outputs": [ { "data": { "text/plain": [ "Association(subject='UniProtKB:A0A024RBG1', predicate='enables', object='GO:0003723', property_values=[], subject_label='NUDT4B', predicate_label=None, object_label=None, negated=None, publications=['GO_REF:0000043'], evidence_type='IEA', supporting_objects=[], primary_knowledge_source='infores:UniProt', aggregator_knowledge_source=None, subject_closure=[], subject_closure_label=[], object_closure=[], object_closure_label=[], comments=[])" ] }, "execution_count": 14, "metadata": {}, "output_type": "execute_result" } ], "execution_count": 14 }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T01:05:47.777533Z", "start_time": "2025-01-16T01:05:47.546272Z" } }, "cell_type": "code", "source": "len([x for x in db[\"goa_human\"][LATEST] if x.negated])", "id": "846c6083be22e228", "outputs": [ { "data": { "text/plain": [ "1494" ] }, "execution_count": 15, "metadata": {}, "output_type": "execute_result" } ], "execution_count": 15 }, { "metadata": {}, "cell_type": "code", "outputs": [], 
"execution_count": null, "source": "# reload modules\n", "id": "f3648e6d2ebabe76" }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T02:04:51.451900Z", "start_time": "2025-01-16T02:04:42.035195Z" } }, "cell_type": "code", "source": "%load_ext autoreload\n", "id": "4e24da22a5fb7756", "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "The autoreload extension is already loaded. To reload it, use:\n", " %reload_ext autoreload\n" ] } ], "execution_count": 30 }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T03:00:50.738855Z", "start_time": "2025-01-16T03:00:50.712857Z" } }, "cell_type": "code", "source": "%autoreload 0", "id": "6c73a0e816464015", "outputs": [], "execution_count": 53 }, { "metadata": {}, "cell_type": "markdown", "source": "## Diffs by terms", "id": "9bc1bc750a447e06" }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T02:05:08.920771Z", "start_time": "2025-01-16T02:05:08.917999Z" } }, "cell_type": "code", "source": "", "id": "ec7960ee3ab0d9da", "outputs": [], "execution_count": null }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T02:05:40.040840Z", "start_time": "2025-01-16T02:05:39.993321Z" } }, "cell_type": "code", "source": [ "from oaklib.utilities.associations.association_differ import AssociationDiffer\n", "\n", "\n", "differ = AssociationDiffer(adapter=go)" ], "id": "a349de5baadc2204", "outputs": [], "execution_count": 32 }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T02:05:40.073956Z", "start_time": "2025-01-16T02:05:40.049886Z" } }, "cell_type": "code", "source": "cache = {}", "id": "f6e2c4e58aca3bde", "outputs": [], "execution_count": 33 }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T03:37:40.874524Z", "start_time": "2025-01-16T03:37:40.870953Z" } }, "cell_type": "code", "source": "len(db[\"goa_human\"].keys())", "id": "b9100eeaecc2d4a2", "outputs": [ { "data": { "text/plain": [ "3" ] }, "execution_count": 73, "metadata": {}, "output_type": "execute_result" } ], 
"execution_count": 73 }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T03:38:07.798450Z", "start_time": "2025-01-16T03:38:07.794257Z" } }, "cell_type": "code", "source": "list(db[\"goa_human\"].keys())", "id": "1d15de57619b4e7b", "outputs": [ { "data": { "text/plain": [ "['2024-11-03', '2024-06-10', '2020-01-01']" ] }, "execution_count": 74, "metadata": {}, "output_type": "execute_result" } ], "execution_count": 74 }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T06:51:21.735705Z", "start_time": "2025-01-16T06:51:13.328317Z" } }, "cell_type": "code", "source": [ "#ix = differ.changes_by_terms(db[\"goa_human\"][LATEST], db[\"goa_human\"][PREVIOUS[0]], min_num_entities_changes=10, cache={})\n", "grp = \"sgd\"\n", "ix = differ.changes_by_terms(db[grp][PREVIOUS[0]], db[grp][LATEST], min_num_entities_changes=2, cache={})\n" ], "id": "dea16c8833b92aaf", "outputs": [], "execution_count": 89 }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T06:51:21.756133Z", "start_time": "2025-01-16T06:51:21.751127Z" } }, "cell_type": "code", "source": "len(ix)", "id": "1295df44a5e49396", "outputs": [ { "data": { "text/plain": [ "847" ] }, "execution_count": 90, "metadata": {}, "output_type": "execute_result" } ], "execution_count": 90 }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T06:51:38.169273Z", "start_time": "2025-01-16T06:51:38.161271Z" } }, "cell_type": "code", "source": [ "for k in list(ix.keys())[0:5]:\n", " print(k, go.label(k))" ], "id": "c52a32e82439ffb2", "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "GO:1904688 regulation of cytoplasmic translational initiation\n", "GO:0170039 proteinogenic amino acid metabolic process\n", "GO:0005980 glycogen catabolic process\n", "GO:0045937 positive regulation of phosphate metabolic process\n", "GO:0042762 regulation of sulfur metabolic process\n" ] } ], "execution_count": 91 }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T06:51:54.175669Z", "start_time": 
"2025-01-16T06:51:54.171142Z" } }, "cell_type": "code", "source": "pubmed_adapter = get_adapter(\"pubmed:\")", "id": "acf63844088ab185", "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "WARNING:eutils._internal.queryservice:No NCBI API key provided; throttling to 3 requests/second; see https://ncbiinsights.ncbi.nlm.nih.gov/2017/11/02/new-api-keys-for-the-e-utilities/\n" ] } ], "execution_count": 92 }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T06:52:10.167483Z", "start_time": "2025-01-16T06:52:10.164456Z" } }, "cell_type": "code", "source": [ "from functools import lru_cache\n", "\n", "\n", "@lru_cache\n", "def pub_date(pmid):\n", " m = pubmed_adapter.entity_metadata_map(pmid)\n", " if m:\n", " return m.get(\"year\")\n" ], "id": "f6b5935b55ce15ca", "outputs": [], "execution_count": 93 }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T08:38:03.124949Z", "start_time": "2025-01-16T08:38:03.114051Z" } }, "cell_type": "code", "source": [ "from typing import Optional\n", "from oaklib.utilities.associations.association_differ import TermComparison\n", "\n", "\n", "def score_term_comparison(term: str, ix: TermComparison, max_date_inclusive=None, max_genes=20) -> Optional[dict]:\n", " \"\"\"\n", " We are interested in genes for which all evidence was from previously known.\n", " \n", " :param term: \n", " :param ix: \n", " :return: \n", " \"\"\"\n", " #all_genes = set(ix.old_associations_by_entity.keys()).union(ix.new_associations_by_entity.keys())\n", " #gene_diff = all_genes - set(ix.old_associations_by_entity.keys()).intersection(ix.new_associations_by_entity.keys())\n", " if len(ix.new_associations_by_entity) > max_genes:\n", " return None\n", " new_genes = set(ix.new_associations_by_entity.keys()) - set(ix.old_associations_by_entity.keys())\n", " gene_id_to_label_map = {}\n", " for g, assocs in ix.new_associations_by_entity.items():\n", " gene_id_to_label_map[g] = assocs[0].subject_label\n", " for g, assocs in 
ix.old_associations_by_entity.items():\n", " gene_id_to_label_map[g] = assocs[0].subject_label\n", " filtered_new_genes = {}\n", " for gene in new_genes:\n", " all_before_cutoff = True\n", " for a in ix.new_associations_by_entity[gene]:\n", " pmids = [x for x in a.publications if x.startswith(\"PMID\")]\n", " if max_date_inclusive is not None:\n", " # print(f\"{term} {gene}, pmids={pmids}\")\n", " if not pmids:\n", " all_before_cutoff = False\n", " else:\n", " pmid = pmids[0]\n", " date = pub_date(pmid)\n", " if date is None or date > max_date_inclusive:\n", " all_before_cutoff = False\n", " if all_before_cutoff:\n", " filtered_new_genes[gene] = ix.new_associations_by_entity[gene]\n", " #gene_id_diff = len(gene_diff)\n", " term_lbl = go.label(term)\n", " if term in mf_terms:\n", " ann_pred = \"that are capable of\"\n", " elif term in bp_terms:\n", " ann_pred = \"involved in\"\n", " elif term in cc_terms:\n", " ann_pred = \"localized to\"\n", " else:\n", " return\n", " def as_genes_list(amap):\n", " return [gene_id_to_label_map[g] for g in amap]\n", " def as_str_list(amap):\n", " return [str(g) for g in amap]\n", " case = {\n", " \"input\": f\"List all genes {ann_pred} {term_lbl}\",\n", " \"ideal\": \"; \".join(as_genes_list(ix.new_associations_by_entity)),\n", " \"original_input\": {\n", " \"term\": str(term),\n", " \"genes_current\": as_str_list(ix.new_associations_by_entity),\n", " \"genes_previous\": as_str_list(ix.old_associations_by_entity),\n", " \"genes_added\": as_genes_list(new_genes),\n", " \"genes_added_prior_to_cutoff\": as_genes_list(filtered_new_genes),\n", " \"num_genes_added_prior_to_cutoff\": len(filtered_new_genes),\n", " \"date_cutoff\": max_date_inclusive,\n", " }\n", " }\n", " return case" ], "id": "8415d4ef59e1c228", "outputs": [], "execution_count": 110 }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-16T08:38:20.387476Z", "start_time": "2025-01-16T08:38:20.116376Z" } }, "cell_type": "code", "source": [ "import yaml\n", "\n", "n = 
import yaml

# Tunables for the selection below
DATE_CUTOFF = "2022"              # evidence must be published in or before this year
MIN_GENES_ADDED_BEFORE_CUTOFF = 2  # a case is kept only if it has MORE than this many such genes
MAX_CASES = 40                    # stop after printing this many cases
EXCLUDED_LABEL_FRAGMENTS = ("regulation", "response to")

num_printed = 0
for term_id, comparison in ix.items():
    # Deliberately not called `lbl`: a later cell defines an `lbl()` helper,
    # and re-running this cell would replace that function with a string.
    term_label = go.label(term_id)
    if not term_label:
        # no label available -> nothing to phrase a question with
        continue
    if any(fragment in term_label for fragment in EXCLUDED_LABEL_FRAGMENTS):
        continue
    case = score_term_comparison(term_id, comparison, max_date_inclusive=DATE_CUTOFF)
    if not case:
        continue
    if case["original_input"]["num_genes_added_prior_to_cutoff"] > MIN_GENES_ADDED_BEFORE_CUTOFF:
        print(yaml.dump(case, sort_keys=False))
        num_printed += 1
        # `>=` so that exactly MAX_CASES are printed (the previous `n > 40`
        # check after the increment let a 41st case through).
        if num_printed >= MAX_CASES:
            break
SGD:S000003331\n", " genes_previous:\n", " - SGD:S000003897\n", " genes_added:\n", " - RVB1\n", " - TEL2\n", " - TTI1\n", " - ASA1\n", " - RVB2\n", " - TRA1\n", " genes_added_prior_to_cutoff:\n", " - RVB1\n", " - TEL2\n", " - TTI1\n", " - ASA1\n", " - RVB2\n", " - TRA1\n", " num_genes_added_prior_to_cutoff: 6\n", " date_cutoff: '2022'\n", "\n", "input: List all genes localized to respiratory chain complex III\n", "ideal: COR1; RIP1; QCR6; QCR8; QCR7; QCR9; QCR10; CYT1; QCR2; COB\n", "original_input:\n", " term: GO:0045275\n", " genes_current:\n", " - SGD:S000000141\n", " - SGD:S000000750\n", " - SGD:S000001929\n", " - SGD:S000003702\n", " - SGD:S000002937\n", " - SGD:S000003415\n", " - SGD:S000003529\n", " - SGD:S000005591\n", " - SGD:S000006395\n", " - SGD:S000007270\n", " genes_previous:\n", " - SGD:S000007270\n", " genes_added:\n", " - QCR10\n", " - COR1\n", " - CYT1\n", " - QCR2\n", " - QCR9\n", " - QCR8\n", " - QCR6\n", " - QCR7\n", " - RIP1\n", " genes_added_prior_to_cutoff:\n", " - QCR10\n", " - COR1\n", " - QCR2\n", " num_genes_added_prior_to_cutoff: 3\n", " date_cutoff: '2022'\n", "\n", "input: List all genes that are capable of alpha-1,4-glucosidase activity\n", "ideal: MAL62; MAL42; MAL22; MAL32; GTB1; MAL12; IMA1; IMA2; IMA3; IMA4; IMA5\n", "original_input:\n", " term: GO:0004558\n", " genes_current:\n", " - SGD:S000029690\n", " - SGD:S000029687\n", " - SGD:S000029682\n", " - SGD:S000000503\n", " - SGD:S000002629\n", " - SGD:S000003524\n", " - SGD:S000003519\n", " - SGD:S000005517\n", " - SGD:S000001434\n", " - SGD:S000003757\n", " - SGD:S000003752\n", " genes_previous:\n", " - SGD:S000002629\n", " genes_added:\n", " - MAL42\n", " - IMA1\n", " - IMA3\n", " - IMA4\n", " - IMA5\n", " - IMA2\n", " - MAL22\n", " - MAL32\n", " - MAL62\n", " - MAL12\n", " genes_added_prior_to_cutoff:\n", " - MAL42\n", " - MAL22\n", " - MAL62\n", " num_genes_added_prior_to_cutoff: 3\n", " date_cutoff: '2022'\n", "\n", "input: List all genes that are capable of G-quadruplex DNA 
binding\n", "ideal: RAP1; MGS1; SUB1; DNA2; NSR1; VID22; MSS116; XRS2; SLX9; PIF1; MRE11; DBP2;\n", " RAD50; DED1; DBP1; RRM3\n", "original_input:\n", " term: GO:0051880\n", " genes_current:\n", " - SGD:S000005160\n", " - SGD:S000005162\n", " - SGD:S000004642\n", " - SGD:S000001207\n", " - SGD:S000003391\n", " - SGD:S000004365\n", " - SGD:S000002602\n", " - SGD:S000002777\n", " - SGD:S000003313\n", " - SGD:S000004526\n", " - SGD:S000004837\n", " - SGD:S000005056\n", " - SGD:S000005194\n", " - SGD:S000005730\n", " - SGD:S000006040\n", " - SGD:S000001073\n", " genes_previous:\n", " - SGD:S000004526\n", " - SGD:S000005160\n", " - SGD:S000005194\n", " - SGD:S000004837\n", " - SGD:S000002777\n", " - SGD:S000005162\n", " - SGD:S000004642\n", " - SGD:S000001207\n", " - SGD:S000003391\n", " - SGD:S000003313\n", " - SGD:S000001073\n", " - SGD:S000004365\n", " genes_added:\n", " - DBP2\n", " - MSS116\n", " - DED1\n", " - DBP1\n", " genes_added_prior_to_cutoff:\n", " - DBP2\n", " - MSS116\n", " - DED1\n", " - DBP1\n", " num_genes_added_prior_to_cutoff: 4\n", " date_cutoff: '2022'\n", "\n", "input: List all genes that are capable of alpha-glucosidase activity\n", "ideal: MAL62; MAL42; MAL22; ROT2; MAL32; SGA1; IMA4; IMA3; GTB1; CWH41; MAL12; IMA1;\n", " IMA5; GDB1; IMA2; YMR196W; STA1; CPX-417; SUC2\n", "original_input:\n", " term: GO:0090599\n", " genes_current:\n", " - SGD:S000029690\n", " - SGD:S000029687\n", " - SGD:S000029682\n", " - SGD:S000000433\n", " - SGD:S000000503\n", " - SGD:S000001361\n", " - SGD:S000003757\n", " - SGD:S000001434\n", " - SGD:S000002629\n", " - SGD:S000002995\n", " - SGD:S000003524\n", " - SGD:S000003519\n", " - SGD:S000003752\n", " - SGD:S000006388\n", " - SGD:S000005517\n", " - SGD:S000004809\n", " - SGD:S000029522\n", " - SGD:S000217621\n", " - SGD:S000001424\n", " genes_previous:\n", " - SGD:S000001361\n", " - SGD:S000001434\n", " - SGD:S000003757\n", " - SGD:S000000433\n", " - SGD:S000000503\n", " - SGD:S000003752\n", " - SGD:S000002995\n", " 
@lru_cache(maxsize=None)
def lineage(t: str):
    """
    Return the term's reflexive is-a/part-of ancestors together with its
    is-a/part-of descendants.

    The returned set is cached and shared between calls -- treat it as read-only.

    :param t: term ID
    :return: set of term IDs
    """
    # Reuse the cached ancestor closure instead of repeating the query;
    # .union() builds a new set, so the cached ancestors are not modified.
    return ancs(t).union(go.descendants(t, predicates=[IS_A, PART_OF]))


@lru_cache(maxsize=None)
def ancs(t: str):
    """
    Return the reflexive is-a/part-of ancestor closure of a term.

    Cached without a size limit: this is called for every annotation row, and
    the default 128-entry LRU is far smaller than the number of distinct terms
    involved, so entries were evicted and recomputed over and over.
    The returned set is cached and shared between calls -- treat it as read-only.

    :param t: term ID
    :return: set of term IDs, including ``t`` itself
    """
    return set(go.ancestors(t, predicates=[IS_A, PART_OF], reflexive=True))
"\n", "def pmid(a):\n", " pubs = [p for p in a.publications if p.startswith(\"PMID\")]\n", " if pubs:\n", " if len(pubs) > 1:\n", " raise ValueError(f\"Multiple PMIDs: {pubs}\")\n", " return pubs[0]\n", " return None\n", "\n", "@lru_cache\n", "def lbl(t: str):\n", " return go.label(t)\n", "\n", "def assocs_to_df(assocs: list, release: str):\n", " \n", " df = pd.DataFrame([{\n", " \"subject\": a.subject,\n", " \"subject_label\": a.subject_label,\n", " \"predicate\": a.predicate,\n", " \"object\": a.object,\n", " \"object_label\": lbl(a.object),\n", " \"object_obsoletes\": a.object in obsoletes,\n", " \"object_uninformative\": a.object in non_informative,\n", " \"object_closure\": ancs(a.object),\n", " \"object_closure_redundant\": ancs(a.object) - {a.object},\n", " \"evidence\": a.evidence_type,\n", " \"is_iba\": a.evidence_type == \"IBA\",\n", " \"negated\": a.negated,\n", " \"pmid\": pmid(a),\n", " \"pubs\": a.publications,\n", " \"release\": release,\n", " } for a in assocs])\n", " return df" ], "id": "8aae919788e4f995", "outputs": [], "execution_count": 290 }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-06T01:29:30.373325Z", "start_time": "2025-01-06T01:25:01.988051Z" } }, "cell_type": "code", "source": [ "human_df = assocs_to_df(db[\"goa_human\"][LATEST], LATEST)\n", "tair_df = assocs_to_df(db[\"tair\"][LATEST], LATEST)\n", "sgd_df = assocs_to_df(db[\"sgd\"][LATEST], LATEST)\n", "df = sgd_df" ], "id": "6a647db06b35a07", "outputs": [], "execution_count": 291 }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-06T01:30:21.920341Z", "start_time": "2025-01-06T01:29:44.689297Z" } }, "cell_type": "code", "source": "prev_df = assocs_to_df(db[\"sgd\"][PREVIOUS[-1]], PREVIOUS[-1])", "id": "c14a72ef574e29ce", "outputs": [], "execution_count": 292 }, { "metadata": { "ExecuteTime": { "end_time": "2025-01-06T01:30:36.207477Z", "start_time": "2025-01-06T01:30:36.191544Z" } }, "cell_type": "code", "source": "df", "id": "2fbff3c4fea8f6b6", "outputs": [ { "data": 
{ "text/plain": [ " subject subject_label predicate object \\\n", "0 SGD:S000003381 GPC1 acts_upstream_of_or_within GO:0090640 \n", "1 SGD:S000005701 ALE1 acts_upstream_of_or_within GO:0090640 \n", "2 SGD:S000003381 GPC1 acts_upstream_of_or_within GO:0036151 \n", "3 SGD:S000004492 RCF1 acts_upstream_of_or_within GO:0033617 \n", "4 SGD:S000004977 SIW14 enables GO:0052845 \n", "... ... ... ... ... \n", "120818 SGD:S000003241 SEC9 involved_in GO:0006906 \n", "120819 SGD:S000004826 CEF1 part_of GO:0000974 \n", "120820 SGD:S000002551 MKC7 involved_in GO:0031505 \n", "120821 SGD:S000003008 HEM2 is_active_in GO:0005829 \n", "120822 SGD:S000001122 LAM4 involved_in GO:0032366 \n", "\n", " object_label object_obsoletes \\\n", "0 phosphatidylcholine biosynthesis from sn-glyce... False \n", "1 phosphatidylcholine biosynthesis from sn-glyce... False \n", "2 phosphatidylcholine acyl-chain remodeling False \n", "3 mitochondrial cytochrome c oxidase assembly False \n", "4 inositol-5-diphosphate-1,2,3,4,6-pentakisphosp... False \n", "... ... ... \n", "120818 vesicle fusion False \n", "120819 Prp19 complex False \n", "120820 fungal-type cell wall organization False \n", "120821 cytosol False \n", "120822 intracellular sterol transport False \n", "\n", " object_uninformative \\\n", "0 False \n", "1 False \n", "2 False \n", "3 False \n", "4 False \n", "... ... \n", "120818 False \n", "120819 False \n", "120820 False \n", "120821 False \n", "120822 False \n", "\n", " object_closure \\\n", "0 {GO:0019637, GO:0008152, BFO:0000015, GO:00066... \n", "1 {GO:0019637, GO:0008152, BFO:0000015, GO:00066... \n", "2 {GO:0019637, GO:0008152, GO:0006796, BFO:00000... \n", "3 {GO:0043933, GO:0044085, GO:0065003, GO:001604... \n", "4 {GO:0016817, GO:0016818, GO:0052842, GO:000382... \n", "... ... \n", "120818 {GO:0048284, GO:0051234, GO:0090174, GO:001604... \n", "120819 {GO:0000974, BFO:0000004, BFO:0000040, BFO:000... \n", "120820 {GO:0071554, GO:0016043, GO:0045229, GO:003150... 
\n", "120821 {CARO:0030000, UBERON:0000061, CARO:0000003, G... \n", "120822 {GO:0006869, GO:0015850, GO:0032365, GO:005123... \n", "\n", " object_closure_redundant evidence is_iba \\\n", "0 {GO:0019637, GO:0008152, GO:0006796, BFO:00000... IGI False \n", "1 {GO:0019637, GO:0008152, GO:0006796, BFO:00000... IGI False \n", "2 {GO:0019637, GO:0008152, GO:0006796, BFO:00000... IMP False \n", "3 {GO:0043933, GO:0044085, GO:0022607, GO:007184... IMP False \n", "4 {GO:0016817, GO:0016818, GO:0052842, GO:000382... IDA False \n", "... ... ... ... \n", "120818 {GO:0061024, BFO:0000015, GO:0009987, GO:00160... IBA True \n", "120819 {BFO:0000004, BFO:0000040, BFO:0000002, GO:003... IBA True \n", "120820 {GO:0071554, GO:0016043, GO:0045229, GO:000998... IBA True \n", "120821 {CARO:0030000, CARO:0000000, BFO:0000004, GO:0... IBA True \n", "120822 {GO:0032365, GO:0015918, GO:0051649, GO:000998... IBA True \n", "\n", " negated pmid pubs release \n", "0 None PMID:30514764 [PMID:30514764] 2024-11-03 \n", "1 None PMID:30514764 [PMID:30514764] 2024-11-03 \n", "2 None PMID:30514764 [PMID:30514764] 2024-11-03 \n", "3 None PMID:29746825 [PMID:29746825] 2024-11-03 \n", "4 None PMID:26828065 [PMID:26828065] 2024-11-03 \n", "... ... ... ... ... \n", "120818 None None [GO_REF:0000033] 2024-11-03 \n", "120819 None None [GO_REF:0000033] 2024-11-03 \n", "120820 None None [GO_REF:0000033] 2024-11-03 \n", "120821 None None [GO_REF:0000033] 2024-11-03 \n", "120822 None None [GO_REF:0000033] 2024-11-03 \n", "\n", "[120823 rows x 15 columns]" ], "text/html": [ "
\n", " | subject | \n", "subject_label | \n", "predicate | \n", "object | \n", "object_label | \n", "object_obsoletes | \n", "object_uninformative | \n", "object_closure | \n", "object_closure_redundant | \n", "evidence | \n", "is_iba | \n", "negated | \n", "pmid | \n", "pubs | \n", "release | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "SGD:S000003381 | \n", "GPC1 | \n", "acts_upstream_of_or_within | \n", "GO:0090640 | \n", "phosphatidylcholine biosynthesis from sn-glyce... | \n", "False | \n", "False | \n", "{GO:0019637, GO:0008152, BFO:0000015, GO:00066... | \n", "{GO:0019637, GO:0008152, GO:0006796, BFO:00000... | \n", "IGI | \n", "False | \n", "None | \n", "PMID:30514764 | \n", "[PMID:30514764] | \n", "2024-11-03 | \n", "
1 | \n", "SGD:S000005701 | \n", "ALE1 | \n", "acts_upstream_of_or_within | \n", "GO:0090640 | \n", "phosphatidylcholine biosynthesis from sn-glyce... | \n", "False | \n", "False | \n", "{GO:0019637, GO:0008152, BFO:0000015, GO:00066... | \n", "{GO:0019637, GO:0008152, GO:0006796, BFO:00000... | \n", "IGI | \n", "False | \n", "None | \n", "PMID:30514764 | \n", "[PMID:30514764] | \n", "2024-11-03 | \n", "
2 | \n", "SGD:S000003381 | \n", "GPC1 | \n", "acts_upstream_of_or_within | \n", "GO:0036151 | \n", "phosphatidylcholine acyl-chain remodeling | \n", "False | \n", "False | \n", "{GO:0019637, GO:0008152, GO:0006796, BFO:00000... | \n", "{GO:0019637, GO:0008152, GO:0006796, BFO:00000... | \n", "IMP | \n", "False | \n", "None | \n", "PMID:30514764 | \n", "[PMID:30514764] | \n", "2024-11-03 | \n", "
3 | \n", "SGD:S000004492 | \n", "RCF1 | \n", "acts_upstream_of_or_within | \n", "GO:0033617 | \n", "mitochondrial cytochrome c oxidase assembly | \n", "False | \n", "False | \n", "{GO:0043933, GO:0044085, GO:0065003, GO:001604... | \n", "{GO:0043933, GO:0044085, GO:0022607, GO:007184... | \n", "IMP | \n", "False | \n", "None | \n", "PMID:29746825 | \n", "[PMID:29746825] | \n", "2024-11-03 | \n", "
4 | \n", "SGD:S000004977 | \n", "SIW14 | \n", "enables | \n", "GO:0052845 | \n", "inositol-5-diphosphate-1,2,3,4,6-pentakisphosp... | \n", "False | \n", "False | \n", "{GO:0016817, GO:0016818, GO:0052842, GO:000382... | \n", "{GO:0016817, GO:0016818, GO:0052842, GO:000382... | \n", "IDA | \n", "False | \n", "None | \n", "PMID:26828065 | \n", "[PMID:26828065] | \n", "2024-11-03 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
120818 | \n", "SGD:S000003241 | \n", "SEC9 | \n", "involved_in | \n", "GO:0006906 | \n", "vesicle fusion | \n", "False | \n", "False | \n", "{GO:0048284, GO:0051234, GO:0090174, GO:001604... | \n", "{GO:0061024, BFO:0000015, GO:0009987, GO:00160... | \n", "IBA | \n", "True | \n", "None | \n", "None | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "
120819 | \n", "SGD:S000004826 | \n", "CEF1 | \n", "part_of | \n", "GO:0000974 | \n", "Prp19 complex | \n", "False | \n", "False | \n", "{GO:0000974, BFO:0000004, BFO:0000040, BFO:000... | \n", "{BFO:0000004, BFO:0000040, BFO:0000002, GO:003... | \n", "IBA | \n", "True | \n", "None | \n", "None | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "
120820 | \n", "SGD:S000002551 | \n", "MKC7 | \n", "involved_in | \n", "GO:0031505 | \n", "fungal-type cell wall organization | \n", "False | \n", "False | \n", "{GO:0071554, GO:0016043, GO:0045229, GO:003150... | \n", "{GO:0071554, GO:0016043, GO:0045229, GO:000998... | \n", "IBA | \n", "True | \n", "None | \n", "None | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "
120821 | \n", "SGD:S000003008 | \n", "HEM2 | \n", "is_active_in | \n", "GO:0005829 | \n", "cytosol | \n", "False | \n", "False | \n", "{CARO:0030000, UBERON:0000061, CARO:0000003, G... | \n", "{CARO:0030000, CARO:0000000, BFO:0000004, GO:0... | \n", "IBA | \n", "True | \n", "None | \n", "None | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "
120822 | \n", "SGD:S000001122 | \n", "LAM4 | \n", "involved_in | \n", "GO:0032366 | \n", "intracellular sterol transport | \n", "False | \n", "False | \n", "{GO:0006869, GO:0015850, GO:0032365, GO:005123... | \n", "{GO:0032365, GO:0015918, GO:0051649, GO:000998... | \n", "IBA | \n", "True | \n", "None | \n", "None | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "
120823 rows × 15 columns
\n", "\n", " | subject | \n", "subject_label | \n", "predicate | \n", "object | \n", "object_label | \n", "object_obsoletes | \n", "object_uninformative | \n", "object_closure | \n", "object_closure_redundant | \n", "evidence | \n", "is_iba | \n", "negated | \n", "pmid | \n", "pubs | \n", "release | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "AGI_LocusCode:AT1G11880 | \n", "AT1G11880 | \n", "enables | \n", "GO:0000009 | \n", "alpha-1,6-mannosyltransferase activity | \n", "False | \n", "False | \n", "{GO:0000030, GO:0003824, GO:0016740, BFO:00000... | \n", "{GO:0000030, GO:0003824, GO:0016740, BFO:00000... | \n", "IEA | \n", "False | \n", "None | \n", "None | \n", "[TAIR:AnalysisReference:501756966] | \n", "2024-11-03 | \n", "
1 | \n", "AGI_LocusCode:AT1G80420 | \n", "ATXRCC1 | \n", "involved_in | \n", "GO:0000012 | \n", "single strand break repair | \n", "False | \n", "False | \n", "{GO:0043170, GO:0033554, GO:0008152, GO:000613... | \n", "{GO:0043170, GO:0008152, BFO:0000015, GO:00099... | \n", "IEA | \n", "False | \n", "None | \n", "None | \n", "[TAIR:AnalysisReference:501756966] | \n", "2024-11-03 | \n", "
2 | \n", "AGI_LocusCode:AT1G74030 | \n", "ENO1 | \n", "part_of | \n", "GO:0000015 | \n", "phosphopyruvate hydratase complex | \n", "False | \n", "False | \n", "{GO:0005829, GO:0110165, BFO:0000002, GO:00329... | \n", "{CARO:0030000, GO:0005829, BFO:0000004, CARO:0... | \n", "IEA | \n", "False | \n", "None | \n", "None | \n", "[TAIR:AnalysisReference:501756966] | \n", "2024-11-03 | \n", "
3 | \n", "AGI_LocusCode:AT2G29560 | \n", "ENOC | \n", "part_of | \n", "GO:0000015 | \n", "phosphopyruvate hydratase complex | \n", "False | \n", "False | \n", "{GO:0005829, GO:0110165, BFO:0000002, GO:00329... | \n", "{CARO:0030000, GO:0005829, BFO:0000004, CARO:0... | \n", "IEA | \n", "False | \n", "None | \n", "None | \n", "[TAIR:AnalysisReference:501756966] | \n", "2024-11-03 | \n", "
4 | \n", "AGI_LocusCode:AT2G36530 | \n", "LOS2 | \n", "part_of | \n", "GO:0000015 | \n", "phosphopyruvate hydratase complex | \n", "False | \n", "False | \n", "{GO:0005829, GO:0110165, BFO:0000002, GO:00329... | \n", "{CARO:0030000, GO:0005829, BFO:0000004, CARO:0... | \n", "IEA | \n", "False | \n", "None | \n", "None | \n", "[TAIR:AnalysisReference:501756966] | \n", "2024-11-03 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
235366 | \n", "TAIR:locus:2058630 | \n", "At2g23210 | \n", "enables | \n", "GO:0010294 | \n", "abscisic acid glucosyltransferase activity | \n", "False | \n", "False | \n", "{GO:0035251, GO:0003824, GO:0016740, BFO:00000... | \n", "{GO:0035251, GO:0003824, GO:0016740, BFO:00000... | \n", "IBA | \n", "True | \n", "None | \n", "None | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "
235367 | \n", "AGI_LocusCode:AT2G15820 | \n", "OTP51 | \n", "involved_in | \n", "GO:0045292 | \n", "mRNA cis splicing, via spliceosome | \n", "False | \n", "False | \n", "{GO:0006397, GO:0008152, GO:0000375, BFO:00000... | \n", "{GO:0009059, GO:0043170, GO:0006397, GO:000815... | \n", "IBA | \n", "True | \n", "None | \n", "None | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "
235368 | \n", "TAIR:locus:2143196 | \n", "At5g15750 | \n", "involved_in | \n", "GO:0042274 | \n", "ribosomal small subunit biogenesis | \n", "False | \n", "False | \n", "{GO:0042274, GO:0044085, GO:0009987, BFO:00000... | \n", "{GO:0044085, GO:0009987, BFO:0000015, GO:00226... | \n", "IBA | \n", "True | \n", "None | \n", "None | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "
235369 | \n", "AGI_LocusCode:AT4G14730 | \n", "LFG1 | \n", "is_active_in | \n", "GO:0016020 | \n", "membrane | \n", "False | \n", "False | \n", "{CARO:0030000, UBERON:0000061, CARO:0000003, G... | \n", "{CARO:0030000, UBERON:0000061, CARO:0000003, G... | \n", "IBA | \n", "True | \n", "None | \n", "None | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "
235370 | \n", "TAIR:locus:2116525 | \n", "SD25 | \n", "enables | \n", "GO:0004672 | \n", "protein kinase activity | \n", "False | \n", "False | \n", "{GO:0140096, GO:0003824, GO:0016740, BFO:00000... | \n", "{GO:0140096, GO:0003824, GO:0016740, BFO:00000... | \n", "IBA | \n", "True | \n", "None | \n", "None | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "
235371 rows × 15 columns
\n", "\n", " | subject | \n", "subject_label | \n", "predicate | \n", "object | \n", "object_label | \n", "object_obsoletes | \n", "object_uninformative | \n", "object_closure | \n", "object_closure_redundant | \n", "evidence | \n", "is_iba | \n", "negated | \n", "pmid | \n", "pubs | \n", "release | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
56871 | \n", "AGI_LocusCode:AT5G62620 | \n", "GALT6 | \n", "located_in | \n", "GO:0005794 | \n", "Golgi apparatus | \n", "False | \n", "False | \n", "{GO:0110165, GO:0043231, BFO:0000002, GO:00057... | \n", "{CARO:0030000, CARO:0000000, BFO:0000004, GO:0... | \n", "ISM | \n", "False | \n", "None | \n", "None | \n", "[TAIR:AnalysisReference:501780126] | \n", "2024-11-03 | \n", "
56872 | \n", "AGI_LocusCode:AT5G62620 | \n", "GALT6 | \n", "located_in | \n", "GO:0005794 | \n", "Golgi apparatus | \n", "False | \n", "False | \n", "{GO:0110165, GO:0043231, BFO:0000002, GO:00057... | \n", "{CARO:0030000, CARO:0000000, BFO:0000004, GO:0... | \n", "ISM | \n", "False | \n", "None | \n", "None | \n", "[TAIR:AnalysisReference:501780126] | \n", "2024-11-03 | \n", "
61144 | \n", "AGI_LocusCode:AT5G62620 | \n", "GALT6 | \n", "involved_in | \n", "GO:0006486 | \n", "protein glycosylation | \n", "False | \n", "False | \n", "{GO:0008152, BFO:0000015, GO:0009100, GO:00434... | \n", "{GO:0009059, GO:0043170, GO:0070085, GO:000815... | \n", "IEA | \n", "False | \n", "None | \n", "None | \n", "[TAIR:AnalysisReference:501757242] | \n", "2024-11-03 | \n", "
85487 | \n", "AGI_LocusCode:AT5G62620 | \n", "GALT6 | \n", "enables | \n", "GO:0030246 | \n", "carbohydrate binding | \n", "False | \n", "True | \n", "{BFO:0000015, GO:0003674, GO:0005488, BFO:0000... | \n", "{GO:0003674, BFO:0000015, GO:0005488, BFO:0000... | \n", "IEA | \n", "False | \n", "None | \n", "None | \n", "[TAIR:AnalysisReference:501756966] | \n", "2024-11-03 | \n", "
165846 | \n", "AGI_LocusCode:AT5G62620 | \n", "GALT6 | \n", "located_in | \n", "GO:0005794 | \n", "Golgi apparatus | \n", "False | \n", "False | \n", "{GO:0110165, GO:0043231, BFO:0000002, GO:00057... | \n", "{CARO:0030000, CARO:0000000, BFO:0000004, GO:0... | \n", "IDA | \n", "False | \n", "None | \n", "PMID:26690932 | \n", "[TAIR:Publication:501767599, PMID:26690932] | \n", "2024-11-03 | \n", "
165851 | \n", "AGI_LocusCode:AT5G62620 | \n", "GALT6 | \n", "involved_in | \n", "GO:0010405 | \n", "arabinogalactan protein metabolic process | \n", "False | \n", "False | \n", "{GO:0043170, GO:0044036, GO:0010384, GO:007155... | \n", "{GO:0043170, GO:0044036, GO:0071554, GO:000815... | \n", "IMP | \n", "False | \n", "None | \n", "PMID:26690932 | \n", "[TAIR:Publication:501767599, PMID:26690932] | \n", "2024-11-03 | \n", "
165856 | \n", "AGI_LocusCode:AT5G62620 | \n", "GALT6 | \n", "involved_in | \n", "GO:0018258 | \n", "protein O-linked glycosylation via hydroxyproline | \n", "False | \n", "False | \n", "{GO:0006493, GO:0008152, BFO:0000015, GO:00091... | \n", "{GO:0009059, GO:0006493, GO:0043170, GO:007008... | \n", "IDA | \n", "False | \n", "None | \n", "PMID:26690932 | \n", "[TAIR:Publication:501767599, PMID:26690932] | \n", "2024-11-03 | \n", "
165858 | \n", "AGI_LocusCode:AT5G62620 | \n", "GALT6 | \n", "acts_upstream_of_or_within | \n", "GO:0048354 | \n", "mucilage biosynthetic process involved in seed... | \n", "False | \n", "False | \n", "{GO:0032501, GO:0008152, GO:0048359, BFO:00000... | \n", "{GO:0032501, GO:0010192, GO:0008152, GO:004835... | \n", "IMP | \n", "False | \n", "None | \n", "PMID:26690932 | \n", "[TAIR:Publication:501767599, PMID:26690932] | \n", "2024-11-03 | \n", "
165863 | \n", "AGI_LocusCode:AT5G62620 | \n", "GALT6 | \n", "acts_upstream_of_or_within | \n", "GO:1900056 | \n", "negative regulation of leaf senescence | \n", "False | \n", "False | \n", "{GO:0065007, BFO:0000015, GO:1900055, GO:00485... | \n", "{GO:0065007, BFO:0000015, GO:1900055, GO:00485... | \n", "IMP | \n", "False | \n", "None | \n", "PMID:26690932 | \n", "[TAIR:Publication:501767599, PMID:26690932] | \n", "2024-11-03 | \n", "
165869 | \n", "AGI_LocusCode:AT5G62620 | \n", "GALT6 | \n", "enables | \n", "GO:1990714 | \n", "hydroxyproline O-galactosyltransferase activity | \n", "False | \n", "False | \n", "{GO:0003824, GO:0016740, BFO:0000015, GO:00083... | \n", "{GO:0003824, GO:0016740, BFO:0000015, GO:00083... | \n", "IDA | \n", "False | \n", "None | \n", "PMID:26690932 | \n", "[TAIR:Publication:501767599, PMID:26690932] | \n", "2024-11-03 | \n", "
210076 | \n", "AGI_LocusCode:AT5G62620 | \n", "GALT6 | \n", "enables | \n", "GO:1990714 | \n", "hydroxyproline O-galactosyltransferase activity | \n", "False | \n", "False | \n", "{GO:0003824, GO:0016740, BFO:0000015, GO:00083... | \n", "{GO:0003824, GO:0016740, BFO:0000015, GO:00083... | \n", "IBA | \n", "True | \n", "None | \n", "None | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "
217996 | \n", "AGI_LocusCode:AT5G62620 | \n", "GALT6 | \n", "is_active_in | \n", "GO:0000139 | \n", "Golgi membrane | \n", "False | \n", "False | \n", "{GO:0110165, GO:0043231, BFO:0000002, GO:00057... | \n", "{CARO:0030000, GO:0005794, CARO:0000000, BFO:0... | \n", "IBA | \n", "True | \n", "None | \n", "None | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "
\n", " | subject | \n", "terms | \n", "n_iba | \n", "n_negated | \n", "closure | \n", "object_closure_redundant | \n", "n_pmid | \n", "release | \n", "
---|---|---|---|---|---|---|---|---|
0 | \n", "SGD:S000000001 | \n", "{GO:0071168, GO:0005739, GO:0008301, GO:000367... | \n", "3 | \n", "0 | \n", "{GO:0005739, GO:0000182, GO:0008152, BFO:00000... | \n", "{GO:0000182, GO:0008152, BFO:0000015, GO:00010... | \n", "{PMID:2404611, PMID:18708580, PMID:2649882, PM... | \n", "2024-11-03 | \n", "
1 | \n", "SGD:S000000002 | \n", "{GO:0015031, GO:0099023, GO:0005768, GO:000662... | \n", "4 | \n", "0 | \n", "{GO:0032509, GO:0071985, GO:0046872, BFO:00000... | \n", "{GO:0032509, GO:0071985, GO:0046872, BFO:00000... | \n", "{PMID:19828734, PMID:30358795, PMID:20173035, ... | \n", "2024-11-03 | \n", "
2 | \n", "SGD:S000000003 | \n", "{GO:0005085, GO:0005737, GO:0032232, GO:000582... | \n", "3 | \n", "0 | \n", "{GO:0005085, GO:0030234, GO:0008152, BFO:00000... | \n", "{GO:0030234, GO:0008152, BFO:0000015, GO:00900... | \n", "{PMID:19545407, PMID:10409717, PMID:17925388, ... | \n", "2024-11-03 | \n", "
3 | \n", "SGD:S000000004 | \n", "{GO:0005829, GO:0072671, GO:0005576, GO:003460... | \n", "9 | \n", "0 | \n", "{GO:1901363, GO:0003723, GO:0008152, BFO:00000... | \n", "{GO:1901363, GO:0003723, GO:0008152, BFO:00000... | \n", "{PMID:18706386, PMID:9789005, PMID:26928762, P... | \n", "2024-11-03 | \n", "
4 | \n", "SGD:S000000005 | \n", "{GO:0015031, GO:0006621, GO:0005789, GO:000688... | \n", "8 | \n", "0 | \n", "{BFO:0000015, GO:0030135, GO:0070972, GO:01101... | \n", "{BFO:0000015, GO:0030135, GO:0070972, GO:01101... | \n", "{PMID:26928762, PMID:10359606, None, PMID:1115... | \n", "2024-11-03 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
6906 | \n", "SGD:S000350095 | \n", "{GO:0008150, GO:0003674, GO:0005575} | \n", "0 | \n", "0 | \n", "{BFO:0000003, BFO:0000015, BFO:0000004, GO:000... | \n", "{BFO:0000004, BFO:0000040, BFO:0000003, BFO:00... | \n", "{None} | \n", "2024-11-03 | \n", "
6907 | \n", "SGD:S000350096 | \n", "{GO:0008150, GO:0003674, GO:0005575} | \n", "0 | \n", "0 | \n", "{BFO:0000003, BFO:0000015, BFO:0000004, GO:000... | \n", "{BFO:0000004, BFO:0000040, BFO:0000003, BFO:00... | \n", "{None} | \n", "2024-11-03 | \n", "
6908 | \n", "SGD:S000350097 | \n", "{GO:0005575, GO:0003674, GO:0008150} | \n", "0 | \n", "0 | \n", "{BFO:0000004, BFO:0000002, GO:0003674, GO:0008... | \n", "{BFO:0000004, BFO:0000002, BFO:0000003, BFO:00... | \n", "{None} | \n", "2024-11-03 | \n", "
6909 | \n", "SGD:S000350098 | \n", "{GO:0005575, GO:0003674, GO:0008150} | \n", "0 | \n", "0 | \n", "{BFO:0000004, BFO:0000002, GO:0003674, GO:0008... | \n", "{BFO:0000004, BFO:0000002, BFO:0000003, BFO:00... | \n", "{None} | \n", "2024-11-03 | \n", "
6910 | \n", "SGD:S000350099 | \n", "{GO:0003674, GO:0005575, GO:0008150} | \n", "0 | \n", "0 | \n", "{BFO:0000040, BFO:0000015, BFO:0000004, GO:000... | \n", "{BFO:0000004, BFO:0000002, BFO:0000003, BFO:00... | \n", "{None} | \n", "2024-11-03 | \n", "
6911 rows × 8 columns
\n", "\n", " | subject | \n", "subject_label | \n", "predicate | \n", "object | \n", "object_label | \n", "object_obsoletes | \n", "object_uninformative | \n", "object_closure | \n", "object_closure_redundant | \n", "evidence | \n", "is_iba | \n", "negated | \n", "pmid | \n", "pubs | \n", "release | \n", "redundant | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
16 | \n", "SGD:S000004539 | \n", "FPR3 | \n", "located_in | \n", "GO:0005634 | \n", "nucleus | \n", "False | \n", "False | \n", "{GO:0110165, GO:0043231, BFO:0000002, GO:00432... | \n", "{CARO:0030000, CARO:0000000, BFO:0000004, GO:0... | \n", "IDA | \n", "False | \n", "None | \n", "PMID:26359986 | \n", "[PMID:26359986] | \n", "2024-11-03 | \n", "True | \n", "
28 | \n", "SGD:S000002699 | \n", "HRQ1 | \n", "enables | \n", "GO:0043138 | \n", "3'-5' DNA helicase activity | \n", "False | \n", "False | \n", "{BFO:0000015, GO:0008150, GO:0016043, GO:00431... | \n", "{GO:0140097, GO:0032508, GO:0003824, BFO:00000... | \n", "IDA | \n", "False | \n", "None | \n", "PMID:28385527 | \n", "[PMID:28385527] | \n", "2024-11-03 | \n", "True | \n", "
33 | \n", "SGD:S000002699 | \n", "HRQ1 | \n", "enables | \n", "GO:0043138 | \n", "3'-5' DNA helicase activity | \n", "False | \n", "False | \n", "{BFO:0000015, GO:0008150, GO:0016043, GO:00431... | \n", "{GO:0140097, GO:0032508, GO:0003824, BFO:00000... | \n", "IDA | \n", "False | \n", "None | \n", "PMID:24440721 | \n", "[PMID:24440721] | \n", "2024-11-03 | \n", "True | \n", "
39 | \n", "SGD:S000003245 | \n", "SNU71 | \n", "located_in | \n", "GO:0005634 | \n", "nucleus | \n", "False | \n", "False | \n", "{GO:0110165, GO:0043231, BFO:0000002, GO:00432... | \n", "{CARO:0030000, CARO:0000000, BFO:0000004, GO:0... | \n", "IEA | \n", "False | \n", "None | \n", "None | \n", "[GO_REF:0000043] | \n", "2024-11-03 | \n", "True | \n", "
42 | \n", "SGD:S000001443 | \n", "DJP1 | \n", "acts_upstream_of_or_within | \n", "GO:0006626 | \n", "protein targeting to mitochondrion | \n", "False | \n", "False | \n", "{GO:0070585, GO:0051234, GO:0006605, GO:007072... | \n", "{GO:0070585, GO:0070727, GO:0033365, BFO:00000... | \n", "IMP | \n", "False | \n", "None | \n", "PMID:30213914 | \n", "[PMID:30213914] | \n", "2024-11-03 | \n", "True | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
105624 | \n", "SGD:S000006483 | \n", "RDN18-2 | \n", "located_in | \n", "GO:0005840 | \n", "ribosome | \n", "False | \n", "False | \n", "{GO:0110165, BFO:0000002, GO:0043229, CL:00000... | \n", "{CARO:0030000, CARO:0000000, BFO:0000004, GO:0... | \n", "IEA | \n", "False | \n", "None | \n", "PMID:30502926 | \n", "[PMID:30502926] | \n", "2024-11-03 | \n", "True | \n", "
105625 | \n", "SGD:S000006502 | \n", "SNR42 | \n", "located_in | \n", "GO:0005730 | \n", "nucleolus | \n", "False | \n", "False | \n", "{GO:0043233, GO:0043231, GO:0110165, BFO:00000... | \n", "{CARO:0030000, GO:0005634, CARO:0000000, BFO:0... | \n", "IEA | \n", "False | \n", "None | \n", "PMID:30502926 | \n", "[PMID:30502926] | \n", "2024-11-03 | \n", "True | \n", "
105627 | \n", "SGD:S000007300 | \n", "SNR36 | \n", "located_in | \n", "GO:0005730 | \n", "nucleolus | \n", "False | \n", "False | \n", "{GO:0043233, GO:0043231, GO:0110165, BFO:00000... | \n", "{CARO:0030000, GO:0005634, CARO:0000000, BFO:0... | \n", "IEA | \n", "False | \n", "None | \n", "PMID:30502926 | \n", "[PMID:30502926] | \n", "2024-11-03 | \n", "True | \n", "
105628 | \n", "SGD:S000006484 | \n", "RDN25-1 | \n", "located_in | \n", "GO:0005840 | \n", "ribosome | \n", "False | \n", "False | \n", "{GO:0110165, BFO:0000002, GO:0043229, CL:00000... | \n", "{CARO:0030000, CARO:0000000, BFO:0000004, GO:0... | \n", "IEA | \n", "False | \n", "None | \n", "PMID:30502926 | \n", "[PMID:30502926] | \n", "2024-11-03 | \n", "True | \n", "
105629 | \n", "SGD:S000006485 | \n", "RDN25-2 | \n", "located_in | \n", "GO:0005840 | \n", "ribosome | \n", "False | \n", "False | \n", "{GO:0110165, BFO:0000002, GO:0043229, CL:00000... | \n", "{CARO:0030000, CARO:0000000, BFO:0000004, GO:0... | \n", "IEA | \n", "False | \n", "None | \n", "PMID:30502926 | \n", "[PMID:30502926] | \n", "2024-11-03 | \n", "True | \n", "
34441 rows × 16 columns
\n", "\n", " | subject | \n", "subject_label | \n", "predicate | \n", "object | \n", "object_label | \n", "object_obsoletes | \n", "object_uninformative | \n", "object_closure | \n", "object_closure_redundant | \n", "evidence | \n", "is_iba | \n", "negated | \n", "pmid | \n", "pubs | \n", "release | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "UniProtKB:A0A024RBG1 | \n", "NUDT4B | \n", "enables | \n", "GO:0003723 | \n", "RNA binding | \n", "False | \n", "True | \n", "{GO:0097159, GO:0003723, BFO:0000015, GO:00036... | \n", "{GO:0097159, BFO:0000015, GO:0003674, GO:00036... | \n", "IEA | \n", "False | \n", "None | \n", "None | \n", "[GO_REF:0000043] | \n", "2024-11-03 | \n", "
1 | \n", "UniProtKB:A0A024RBG1 | \n", "NUDT4B | \n", "enables | \n", "GO:0005515 | \n", "protein binding | \n", "False | \n", "True | \n", "{BFO:0000015, GO:0003674, GO:0005488, BFO:0000... | \n", "{GO:0003674, BFO:0000015, GO:0005488, BFO:0000... | \n", "IPI | \n", "False | \n", "None | \n", "PMID:33961781 | \n", "[PMID:33961781] | \n", "2024-11-03 | \n", "
2 | \n", "UniProtKB:A0A024RBG1 | \n", "NUDT4B | \n", "enables | \n", "GO:0046872 | \n", "metal ion binding | \n", "False | \n", "True | \n", "{GO:0043169, GO:0046872, BFO:0000015, GO:00360... | \n", "{GO:0043169, BFO:0000015, GO:0036094, GO:00431... | \n", "IEA | \n", "False | \n", "None | \n", "None | \n", "[GO_REF:0000043] | \n", "2024-11-03 | \n", "
3 | \n", "UniProtKB:A0A024RBG1 | \n", "NUDT4B | \n", "located_in | \n", "GO:0005829 | \n", "cytosol | \n", "False | \n", "False | \n", "{CARO:0030000, UBERON:0000061, CARO:0000003, G... | \n", "{CARO:0030000, CARO:0000000, BFO:0000004, GO:0... | \n", "IDA | \n", "False | \n", "None | \n", "None | \n", "[GO_REF:0000052] | \n", "2024-11-03 | \n", "
4 | \n", "UniProtKB:A0A075B6H5 | \n", "TRBV20OR9-2 | \n", "involved_in | \n", "GO:0002376 | \n", "immune system process | \n", "False | \n", "False | \n", "{GO:0008150, BFO:0000015, GO:0002376, BFO:0000... | \n", "{BFO:0000015, GO:0008150, BFO:0000003} | \n", "IEA | \n", "False | \n", "None | \n", "None | \n", "[GO_REF:0000043] | \n", "2024-11-03 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
782818 | \n", "UniProtKB:Q9NZC2 | \n", "TREM2 | \n", "involved_in | \n", "GO:0045088 | \n", "regulation of innate immune response | \n", "False | \n", "False | \n", "{GO:0065007, GO:0002682, GO:0050776, BFO:00000... | \n", "{GO:0065007, GO:0002682, GO:0050776, BFO:00000... | \n", "IBA | \n", "True | \n", "None | \n", "None | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "
782819 | \n", "UniProtKB:Q9Y2K2 | \n", "SIK3 | \n", "enables | \n", "GO:0050321 | \n", "tau-protein kinase activity | \n", "False | \n", "False | \n", "{GO:0140096, GO:0003824, GO:0004674, GO:001674... | \n", "{GO:0140096, GO:0003824, GO:0004674, GO:001674... | \n", "IBA | \n", "True | \n", "None | \n", "None | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "
782820 | \n", "UniProtKB:P43235 | \n", "CTSK | \n", "involved_in | \n", "GO:0051603 | \n", "proteolysis involved in protein catabolic process | \n", "False | \n", "False | \n", "{GO:0043170, GO:0006508, GO:0044238, GO:000905... | \n", "{GO:0043170, GO:0006508, GO:0044238, GO:000905... | \n", "IBA | \n", "True | \n", "None | \n", "None | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "
782821 | \n", "UniProtKB:Q07343 | \n", "PDE4B | \n", "enables | \n", "GO:0047555 | \n", "3',5'-cyclic-GMP phosphodiesterase activity | \n", "False | \n", "False | \n", "{GO:0047555, GO:0003824, GO:0008081, BFO:00000... | \n", "{GO:0003824, GO:0008081, BFO:0000015, GO:00425... | \n", "IBA | \n", "True | \n", "None | \n", "None | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "
782822 | \n", "UniProtKB:A6NC42 | \n", "DPPA5 | \n", "involved_in | \n", "GO:0010468 | \n", "regulation of gene expression | \n", "False | \n", "False | \n", "{GO:0065007, GO:0060255, GO:0009889, BFO:00000... | \n", "{GO:0065007, GO:0060255, GO:0009889, BFO:00000... | \n", "IBA | \n", "True | \n", "None | \n", "None | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "
782823 rows × 15 columns
\n", "\n", " | subject | \n", "subject_label | \n", "predicate | \n", "object | \n", "object_label | \n", "object_obsoletes | \n", "object_uninformative | \n", "object_closure | \n", "object_closure_redundant | \n", "evidence | \n", "... | \n", "pubs | \n", "release | \n", "pmid_new | \n", "is_new | \n", "fresh | \n", "pmid_removed | \n", "unique | \n", "redacted | \n", "redundant | \n", "iba_rejected | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "UniProtKB:A0A024RBG1 | \n", "NUDT4B | \n", "enables | \n", "GO:0003723 | \n", "RNA binding | \n", "False | \n", "True | \n", "{GO:0097159, GO:0003723, BFO:0000015, GO:00036... | \n", "{GO:0097159, BFO:0000015, GO:0003674, GO:00036... | \n", "IEA | \n", "... | \n", "[GO_REF:0000043] | \n", "2024-11-03 | \n", "False | \n", "False | \n", "False | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "True | \n", "
1 | \n", "UniProtKB:A0A024RBG1 | \n", "NUDT4B | \n", "enables | \n", "GO:0005515 | \n", "protein binding | \n", "False | \n", "True | \n", "{BFO:0000015, GO:0003674, GO:0005488, BFO:0000... | \n", "{GO:0003674, BFO:0000015, GO:0005488, BFO:0000... | \n", "IPI | \n", "... | \n", "[PMID:33961781] | \n", "2024-11-03 | \n", "True | \n", "True | \n", "True | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "True | \n", "
2 | \n", "UniProtKB:A0A024RBG1 | \n", "NUDT4B | \n", "enables | \n", "GO:0046872 | \n", "metal ion binding | \n", "False | \n", "True | \n", "{GO:0043169, GO:0046872, BFO:0000015, GO:00360... | \n", "{GO:0043169, BFO:0000015, GO:0036094, GO:00431... | \n", "IEA | \n", "... | \n", "[GO_REF:0000043] | \n", "2024-11-03 | \n", "False | \n", "False | \n", "False | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "True | \n", "
3 | \n", "UniProtKB:A0A024RBG1 | \n", "NUDT4B | \n", "located_in | \n", "GO:0005829 | \n", "cytosol | \n", "False | \n", "False | \n", "{CARO:0030000, UBERON:0000061, CARO:0000003, G... | \n", "{CARO:0030000, CARO:0000000, BFO:0000004, GO:0... | \n", "IDA | \n", "... | \n", "[GO_REF:0000052] | \n", "2024-11-03 | \n", "False | \n", "False | \n", "False | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "True | \n", "
4 | \n", "UniProtKB:A0A075B6H5 | \n", "TRBV20OR9-2 | \n", "involved_in | \n", "GO:0002376 | \n", "immune system process | \n", "False | \n", "False | \n", "{GO:0008150, BFO:0000015, GO:0002376, BFO:0000... | \n", "{BFO:0000015, GO:0008150, BFO:0000003} | \n", "IEA | \n", "... | \n", "[GO_REF:0000043] | \n", "2024-11-03 | \n", "False | \n", "True | \n", "False | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "True | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
434570 | \n", "UniProtKB:Q9Y6A4 | \n", "CFAP20 | \n", "None | \n", "GO:0007275 | \n", "multicellular organism development | \n", "False | \n", "True | \n", "{GO:0032501, BFO:0000015, GO:0048856, GO:00325... | \n", "{GO:0032501, BFO:0000015, GO:0048856, GO:00325... | \n", "TAS | \n", "... | \n", "[PMID:8688464] | \n", "2020-01-01 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "True | \n", "True | \n", "True | \n", "False | \n", "True | \n", "
435058 | \n", "UniProtKB:Q9Y6F1 | \n", "PARP3 | \n", "None | \n", "GO:0006281 | \n", "DNA repair | \n", "False | \n", "False | \n", "{GO:0043170, GO:0033554, GO:0008152, GO:000613... | \n", "{GO:0043170, GO:0008152, BFO:0000015, GO:00099... | \n", "TAS | \n", "... | \n", "[PMID:7260241] | \n", "2020-01-01 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "True | \n", "True | \n", "True | \n", "True | \n", "False | \n", "
436209 | \n", "UniProtKB:Q9Y6Q9 | \n", "NCOA3 | \n", "None | \n", "GO:0000981 | \n", "DNA-binding transcription factor activity, RNA... | \n", "False | \n", "False | \n", "{BFO:0000015, GO:0006357, GO:0008150, GO:00192... | \n", "{GO:0065007, GO:0060255, GO:0009889, BFO:00000... | \n", "ISM | \n", "... | \n", "[PMID:19274049] | \n", "2020-01-01 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "True | \n", "True | \n", "True | \n", "False | \n", "True | \n", "
436550 | \n", "UniProtKB:Q9Y6X0 | \n", "SETBP1 | \n", "None | \n", "GO:0000981 | \n", "DNA-binding transcription factor activity, RNA... | \n", "False | \n", "False | \n", "{BFO:0000015, GO:0006357, GO:0008150, GO:00192... | \n", "{GO:0065007, GO:0060255, GO:0009889, BFO:00000... | \n", "ISM | \n", "... | \n", "[PMID:19274049] | \n", "2020-01-01 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "True | \n", "True | \n", "True | \n", "False | \n", "True | \n", "
436732 | \n", "UniProtKB:Q9Y6Y1 | \n", "CAMTA1 | \n", "None | \n", "GO:0000981 | \n", "DNA-binding transcription factor activity, RNA... | \n", "False | \n", "False | \n", "{BFO:0000015, GO:0006357, GO:0008150, GO:00192... | \n", "{GO:0065007, GO:0060255, GO:0009889, BFO:00000... | \n", "ISM | \n", "... | \n", "[PMID:19274049] | \n", "2020-01-01 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "True | \n", "True | \n", "True | \n", "False | \n", "True | \n", "
783918 rows × 23 columns
\n", "\n", " | subject | \n", "subject_label | \n", "predicate | \n", "object | \n", "object_label | \n", "object_obsoletes | \n", "object_uninformative | \n", "object_closure | \n", "object_closure_redundant | \n", "evidence | \n", "... | \n", "pubs | \n", "release | \n", "pmid_new | \n", "is_new | \n", "fresh | \n", "pmid_removed | \n", "unique | \n", "redacted | \n", "redundant | \n", "iba_rejected | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "UniProtKB:A0A024RBG1 | \n", "NUDT4B | \n", "enables | \n", "GO:0003723 | \n", "RNA binding | \n", "False | \n", "True | \n", "{GO:0097159, GO:0003723, BFO:0000015, GO:00036... | \n", "{GO:0097159, BFO:0000015, GO:0003674, GO:00036... | \n", "IEA | \n", "... | \n", "[GO_REF:0000043] | \n", "2024-11-03 | \n", "False | \n", "False | \n", "False | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "True | \n", "
1 | \n", "UniProtKB:A0A024RBG1 | \n", "NUDT4B | \n", "enables | \n", "GO:0005515 | \n", "protein binding | \n", "False | \n", "True | \n", "{BFO:0000015, GO:0003674, GO:0005488, BFO:0000... | \n", "{GO:0003674, BFO:0000015, GO:0005488, BFO:0000... | \n", "IPI | \n", "... | \n", "[PMID:33961781] | \n", "2024-11-03 | \n", "True | \n", "True | \n", "True | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "True | \n", "
2 | \n", "UniProtKB:A0A024RBG1 | \n", "NUDT4B | \n", "enables | \n", "GO:0046872 | \n", "metal ion binding | \n", "False | \n", "True | \n", "{GO:0043169, GO:0046872, BFO:0000015, GO:00360... | \n", "{GO:0043169, BFO:0000015, GO:0036094, GO:00431... | \n", "IEA | \n", "... | \n", "[GO_REF:0000043] | \n", "2024-11-03 | \n", "False | \n", "False | \n", "False | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "True | \n", "
3 | \n", "UniProtKB:A0A024RBG1 | \n", "NUDT4B | \n", "located_in | \n", "GO:0005829 | \n", "cytosol | \n", "False | \n", "False | \n", "{CARO:0030000, UBERON:0000061, CARO:0000003, G... | \n", "{CARO:0030000, CARO:0000000, BFO:0000004, GO:0... | \n", "IDA | \n", "... | \n", "[GO_REF:0000052] | \n", "2024-11-03 | \n", "False | \n", "False | \n", "False | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "True | \n", "
4 | \n", "UniProtKB:A0A075B6H5 | \n", "TRBV20OR9-2 | \n", "involved_in | \n", "GO:0002376 | \n", "immune system process | \n", "False | \n", "False | \n", "{GO:0008150, BFO:0000015, GO:0002376, BFO:0000... | \n", "{BFO:0000015, GO:0008150, BFO:0000003} | \n", "IEA | \n", "... | \n", "[GO_REF:0000043] | \n", "2024-11-03 | \n", "False | \n", "True | \n", "False | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "True | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
433680 | \n", "UniProtKB:Q9Y5Y6 | \n", "ST14 | \n", "None | \n", "GO:0005887 | \n", "None | \n", "True | \n", "False | \n", "{GO:0005887} | \n", "{} | \n", "TAS | \n", "... | \n", "[PMID:10831593] | \n", "2020-01-01 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "True | \n", "True | \n", "True | \n", "False | \n", "True | \n", "
434570 | \n", "UniProtKB:Q9Y6A4 | \n", "CFAP20 | \n", "None | \n", "GO:0007275 | \n", "multicellular organism development | \n", "False | \n", "True | \n", "{GO:0032501, BFO:0000015, GO:0048856, GO:00325... | \n", "{GO:0032501, BFO:0000015, GO:0048856, GO:00325... | \n", "TAS | \n", "... | \n", "[PMID:8688464] | \n", "2020-01-01 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "True | \n", "True | \n", "True | \n", "False | \n", "True | \n", "
436209 | \n", "UniProtKB:Q9Y6Q9 | \n", "NCOA3 | \n", "None | \n", "GO:0000981 | \n", "DNA-binding transcription factor activity, RNA... | \n", "False | \n", "False | \n", "{BFO:0000015, GO:0006357, GO:0008150, GO:00192... | \n", "{GO:0065007, GO:0060255, GO:0009889, BFO:00000... | \n", "ISM | \n", "... | \n", "[PMID:19274049] | \n", "2020-01-01 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "True | \n", "True | \n", "True | \n", "False | \n", "True | \n", "
436550 | \n", "UniProtKB:Q9Y6X0 | \n", "SETBP1 | \n", "None | \n", "GO:0000981 | \n", "DNA-binding transcription factor activity, RNA... | \n", "False | \n", "False | \n", "{BFO:0000015, GO:0006357, GO:0008150, GO:00192... | \n", "{GO:0065007, GO:0060255, GO:0009889, BFO:00000... | \n", "ISM | \n", "... | \n", "[PMID:19274049] | \n", "2020-01-01 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "True | \n", "True | \n", "True | \n", "False | \n", "True | \n", "
436732 | \n", "UniProtKB:Q9Y6Y1 | \n", "CAMTA1 | \n", "None | \n", "GO:0000981 | \n", "DNA-binding transcription factor activity, RNA... | \n", "False | \n", "False | \n", "{BFO:0000015, GO:0006357, GO:0008150, GO:00192... | \n", "{GO:0065007, GO:0060255, GO:0009889, BFO:00000... | \n", "ISM | \n", "... | \n", "[PMID:19274049] | \n", "2020-01-01 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "True | \n", "True | \n", "True | \n", "False | \n", "True | \n", "
450057 rows × 23 columns
\n", "\n", " | subject | \n", "subject_label | \n", "predicate | \n", "object | \n", "object_label | \n", "object_obsoletes | \n", "object_uninformative | \n", "object_closure | \n", "object_closure_redundant | \n", "evidence | \n", "is_iba | \n", "negated | \n", "pmid | \n", "pubs | \n", "release | \n", "pmid_new | \n", "is_new | \n", "fresh | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
1 | \n", "UniProtKB:A0A024RBG1 | \n", "NUDT4B | \n", "enables | \n", "GO:0005515 | \n", "protein binding | \n", "False | \n", "True | \n", "{BFO:0000015, GO:0003674, GO:0005488, BFO:0000... | \n", "{GO:0003674, BFO:0000015, GO:0005488, BFO:0000... | \n", "IPI | \n", "False | \n", "None | \n", "PMID:33961781 | \n", "[PMID:33961781] | \n", "2024-11-03 | \n", "True | \n", "True | \n", "True | \n", "
357 | \n", "UniProtKB:A0A096LP55 | \n", "UQCRHL | \n", "located_in | \n", "GO:0005739 | \n", "mitochondrion | \n", "False | \n", "False | \n", "{GO:0005739, GO:0110165, GO:0043231, BFO:00000... | \n", "{CARO:0030000, CARO:0000000, BFO:0000004, GO:0... | \n", "HTP | \n", "False | \n", "None | \n", "PMID:34800366 | \n", "[PMID:34800366] | \n", "2024-11-03 | \n", "True | \n", "True | \n", "True | \n", "
569 | \n", "UniProtKB:A0A0B4J2F0 | \n", "PIGBOS1 | \n", "located_in | \n", "GO:0005739 | \n", "mitochondrion | \n", "False | \n", "False | \n", "{GO:0005739, GO:0110165, GO:0043231, BFO:00000... | \n", "{CARO:0030000, CARO:0000000, BFO:0000004, GO:0... | \n", "HTP | \n", "False | \n", "None | \n", "PMID:34800366 | \n", "[PMID:34800366] | \n", "2024-11-03 | \n", "True | \n", "True | \n", "True | \n", "
1904 | \n", "UniProtKB:A1A4Y4 | \n", "IRGM | \n", "enables | \n", "GO:1901612 | \n", "cardiolipin binding | \n", "False | \n", "True | \n", "{GO:0008289, GO:0043168, GO:1901612, BFO:00000... | \n", "{GO:0008289, GO:0043168, BFO:0000015, GO:00360... | \n", "IDA | \n", "False | \n", "None | \n", "PMID:21102437 | \n", "[PMID:21102437] | \n", "2024-11-03 | \n", "True | \n", "True | \n", "True | \n", "
1945 | \n", "UniProtKB:A1A4Y4 | \n", "IRGM | \n", "involved_in | \n", "GO:0090141 | \n", "positive regulation of mitochondrial fission | \n", "False | \n", "False | \n", "{GO:0010821, GO:0051130, GO:0065007, GO:003304... | \n", "{GO:0010821, GO:0051130, GO:0065007, GO:003304... | \n", "IDA | \n", "False | \n", "None | \n", "PMID:21102437 | \n", "[PMID:21102437] | \n", "2024-11-03 | \n", "True | \n", "True | \n", "True | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
718365 | \n", "RNAcentral:URS00026A23F2_9606 | \n", "URS00026A23F2_9606 | \n", "enables | \n", "GO:0141180 | \n", "dsDNA-RNA triple helix-forming chromatin adapt... | \n", "False | \n", "True | \n", "{GO:0030674, BFO:0000015, GO:0043565, GO:00036... | \n", "{GO:0003690, GO:0030674, GO:0003677, GO:007184... | \n", "IDA | \n", "False | \n", "None | \n", "PMID:27634931 | \n", "[PMID:27634931] | \n", "2024-11-03 | \n", "True | \n", "True | \n", "True | \n", "
718366 | \n", "RNAcentral:URS00026A23F2_9606 | \n", "URS00026A23F2_9606 | \n", "involved_in | \n", "GO:0000122 | \n", "negative regulation of transcription by RNA po... | \n", "False | \n", "False | \n", "{BFO:0000015, GO:0006357, GO:0008150, GO:00098... | \n", "{GO:0045934, GO:0009892, GO:0065007, GO:000988... | \n", "IMP | \n", "False | \n", "None | \n", "PMID:27634931 | \n", "[PMID:27634931] | \n", "2024-11-03 | \n", "True | \n", "True | \n", "True | \n", "
718367 | \n", "RNAcentral:URS00026A23F2_9606 | \n", "URS00026A23F2_9606 | \n", "involved_in | \n", "GO:0000512 | \n", "lncRNA-mediated post-transcriptional gene sile... | \n", "False | \n", "False | \n", "{GO:0000512, BFO:0000015, GO:0016441, GO:00081... | \n", "{GO:0065007, GO:0009892, GO:0031047, GO:000988... | \n", "IDA | \n", "False | \n", "None | \n", "PMID:30720199 | \n", "[PMID:30720199] | \n", "2024-11-03 | \n", "True | \n", "True | \n", "True | \n", "
718368 | \n", "RNAcentral:URS00026A23F2_9606 | \n", "URS00026A23F2_9606 | \n", "involved_in | \n", "GO:0000512 | \n", "lncRNA-mediated post-transcriptional gene sile... | \n", "False | \n", "False | \n", "{GO:0000512, BFO:0000015, GO:0016441, GO:00081... | \n", "{GO:0065007, GO:0009892, GO:0031047, GO:000988... | \n", "IMP | \n", "False | \n", "None | \n", "PMID:33102210 | \n", "[PMID:33102210] | \n", "2024-11-03 | \n", "True | \n", "True | \n", "True | \n", "
718370 | \n", "RNAcentral:URS00026A23F2_9606 | \n", "URS00026A23F2_9606 | \n", "involved_in | \n", "GO:0090399 | \n", "replicative senescence | \n", "False | \n", "False | \n", "{GO:0008152, BFO:0000015, GO:0090399, GO:00099... | \n", "{GO:0008152, BFO:0000015, GO:0009987, GO:00081... | \n", "IMP | \n", "False | \n", "None | \n", "PMID:27634931 | \n", "[PMID:27634931] | \n", "2024-11-03 | \n", "True | \n", "True | \n", "True | \n", "
3380 rows × 18 columns
\n", "\n", " | subject | \n", "subject_label | \n", "predicate | \n", "object | \n", "object_label | \n", "object_obsoletes | \n", "object_uninformative | \n", "object_closure | \n", "object_closure_redundant | \n", "evidence | \n", "... | \n", "pubs | \n", "release | \n", "pmid_new | \n", "is_new | \n", "fresh | \n", "pmid_removed | \n", "unique | \n", "redacted | \n", "redundant | \n", "iba_rejected | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
4876 | \n", "UniProtKB:A6NNL5 | \n", "C15orf61 | \n", "located_in | \n", "GO:0005739 | \n", "mitochondrion | \n", "False | \n", "False | \n", "{GO:0005739, GO:0110165, GO:0043231, BFO:00000... | \n", "{CARO:0030000, CARO:0000000, BFO:0000004, GO:0... | \n", "HTP | \n", "... | \n", "[PMID:34800366] | \n", "2024-11-03 | \n", "True | \n", "True | \n", "True | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "False | \n", "
5853 | \n", "UniProtKB:A8MSI8 | \n", "LYRM9 | \n", "located_in | \n", "GO:0005739 | \n", "mitochondrion | \n", "False | \n", "False | \n", "{GO:0005739, GO:0110165, GO:0043231, BFO:00000... | \n", "{CARO:0030000, CARO:0000000, BFO:0000004, GO:0... | \n", "HTP | \n", "... | \n", "[PMID:34800366] | \n", "2024-11-03 | \n", "True | \n", "True | \n", "True | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "False | \n", "
6327 | \n", "UniProtKB:A8MXV4 | \n", "NUDT19 | \n", "located_in | \n", "GO:0005739 | \n", "mitochondrion | \n", "False | \n", "False | \n", "{GO:0005739, GO:0110165, GO:0043231, BFO:00000... | \n", "{CARO:0030000, CARO:0000000, BFO:0000004, GO:0... | \n", "HTP | \n", "... | \n", "[PMID:34800366] | \n", "2024-11-03 | \n", "True | \n", "True | \n", "True | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "False | \n", "
15942 | \n", "UniProtKB:O14521 | \n", "SDHD | \n", "part_of | \n", "GO:0045273 | \n", "respiratory chain complex II (succinate dehydr... | \n", "False | \n", "False | \n", "{GO:0098796, GO:0110165, GO:0045273, BFO:00000... | \n", "{CARO:0030000, GO:0098803, GO:0098796, CARO:00... | \n", "IDA | \n", "... | \n", "[PMID:37098072] | \n", "2024-11-03 | \n", "True | \n", "True | \n", "True | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "False | \n", "
34482 | \n", "UniProtKB:O43325 | \n", "LYRM1 | \n", "located_in | \n", "GO:0005739 | \n", "mitochondrion | \n", "False | \n", "False | \n", "{GO:0005739, GO:0110165, GO:0043231, BFO:00000... | \n", "{CARO:0030000, CARO:0000000, BFO:0000004, GO:0... | \n", "HTP | \n", "... | \n", "[PMID:34800366] | \n", "2024-11-03 | \n", "True | \n", "True | \n", "True | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "False | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
718362 | \n", "RNAcentral:URS00026A23F2_9606 | \n", "URS00026A23F2_9606 | \n", "acts_upstream_of | \n", "GO:0008284 | \n", "positive regulation of cell population prolife... | \n", "False | \n", "False | \n", "{GO:0065007, GO:0042127, GO:0048518, BFO:00000... | \n", "{GO:0065007, GO:0042127, GO:0048518, BFO:00000... | \n", "IMP | \n", "... | \n", "[PMID:33102210] | \n", "2024-11-03 | \n", "True | \n", "True | \n", "True | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "False | \n", "
718366 | \n", "RNAcentral:URS00026A23F2_9606 | \n", "URS00026A23F2_9606 | \n", "involved_in | \n", "GO:0000122 | \n", "negative regulation of transcription by RNA po... | \n", "False | \n", "False | \n", "{BFO:0000015, GO:0006357, GO:0008150, GO:00098... | \n", "{GO:0045934, GO:0009892, GO:0065007, GO:000988... | \n", "IMP | \n", "... | \n", "[PMID:27634931] | \n", "2024-11-03 | \n", "True | \n", "True | \n", "True | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "False | \n", "
718367 | \n", "RNAcentral:URS00026A23F2_9606 | \n", "URS00026A23F2_9606 | \n", "involved_in | \n", "GO:0000512 | \n", "lncRNA-mediated post-transcriptional gene sile... | \n", "False | \n", "False | \n", "{GO:0000512, BFO:0000015, GO:0016441, GO:00081... | \n", "{GO:0065007, GO:0009892, GO:0031047, GO:000988... | \n", "IDA | \n", "... | \n", "[PMID:30720199] | \n", "2024-11-03 | \n", "True | \n", "True | \n", "True | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "False | \n", "
718368 | \n", "RNAcentral:URS00026A23F2_9606 | \n", "URS00026A23F2_9606 | \n", "involved_in | \n", "GO:0000512 | \n", "lncRNA-mediated post-transcriptional gene sile... | \n", "False | \n", "False | \n", "{GO:0000512, BFO:0000015, GO:0016441, GO:00081... | \n", "{GO:0065007, GO:0009892, GO:0031047, GO:000988... | \n", "IMP | \n", "... | \n", "[PMID:33102210] | \n", "2024-11-03 | \n", "True | \n", "True | \n", "True | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "False | \n", "
718370 | \n", "RNAcentral:URS00026A23F2_9606 | \n", "URS00026A23F2_9606 | \n", "involved_in | \n", "GO:0090399 | \n", "replicative senescence | \n", "False | \n", "False | \n", "{GO:0008152, BFO:0000015, GO:0090399, GO:00099... | \n", "{GO:0008152, BFO:0000015, GO:0009987, GO:00081... | \n", "IMP | \n", "... | \n", "[PMID:27634931] | \n", "2024-11-03 | \n", "True | \n", "True | \n", "True | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "False | \n", "
524 rows × 23 columns
\n", "\n", " | subject | \n", "subject_label | \n", "predicate | \n", "object | \n", "object_label | \n", "object_obsoletes | \n", "object_uninformative | \n", "object_closure | \n", "object_closure_redundant | \n", "evidence | \n", "... | \n", "pubs | \n", "release | \n", "pmid_new | \n", "is_new | \n", "fresh | \n", "pmid_removed | \n", "unique | \n", "redacted | \n", "redundant | \n", "iba_rejected | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
401144 | \n", "UniProtKB:Q8N6R0 | \n", "METTL13 | \n", "involved_in | \n", "GO:0000122 | \n", "negative regulation of transcription by RNA po... | \n", "False | \n", "False | \n", "{BFO:0000015, GO:0006357, GO:0008150, GO:00098... | \n", "{GO:0045934, GO:0009892, GO:0065007, GO:000988... | \n", "IMP | \n", "... | \n", "[PMID:26763933] | \n", "2024-06-10 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "True | \n", "True | \n", "True | \n", "False | \n", "False | \n", "
401146 | \n", "UniProtKB:Q8N6R0 | \n", "METTL13 | \n", "involved_in | \n", "GO:1902807 | \n", "negative regulation of cell cycle G1/S phase t... | \n", "False | \n", "False | \n", "{GO:0065007, GO:1902806, GO:0010948, GO:190198... | \n", "{GO:0065007, GO:0010948, GO:1901988, GO:005172... | \n", "IMP | \n", "... | \n", "[PMID:26763933] | \n", "2024-06-10 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "True | \n", "True | \n", "True | \n", "False | \n", "False | \n", "
453842 | \n", "UniProtKB:Q96K19 | \n", "RNF170 | \n", "involved_in | \n", "GO:0034140 | \n", "negative regulation of toll-like receptor 3 si... | \n", "False | \n", "False | \n", "{GO:0048585, GO:0062207, GO:1902532, GO:000996... | \n", "{GO:0048585, GO:0065007, GO:0002682, GO:006220... | \n", "IDA | \n", "... | \n", "[PMID:31076723] | \n", "2024-06-10 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "True | \n", "True | \n", "True | \n", "False | \n", "False | \n", "
587451 | \n", "RNAcentral:URS0000083D87_9606 | \n", "URS0000083D87_9606 | \n", "involved_in | \n", "GO:0035195 | \n", "miRNA-mediated post-transcriptional gene silen... | \n", "False | \n", "False | \n", "{BFO:0000015, GO:0016441, GO:0008150, GO:00106... | \n", "{GO:0065007, GO:0009892, GO:0031047, GO:000988... | \n", "IDA | \n", "... | \n", "[PMID:28640956] | \n", "2024-06-10 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "True | \n", "True | \n", "True | \n", "False | \n", "False | \n", "
587452 | \n", "RNAcentral:URS0000083D87_9606 | \n", "URS0000083D87_9606 | \n", "involved_in | \n", "GO:0090051 | \n", "negative regulation of cell migration involved... | \n", "False | \n", "False | \n", "{GO:0030336, BFO:0000015, GO:0008150, GO:00105... | \n", "{GO:0065007, GO:0030336, BFO:0000015, GO:00485... | \n", "IGI | \n", "... | \n", "[PMID:28640956] | \n", "2024-06-10 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "True | \n", "True | \n", "True | \n", "False | \n", "False | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
424250 | \n", "UniProtKB:Q9Y226 | \n", "SLC22A13 | \n", "None | \n", "GO:0015695 | \n", "organic cation transport | \n", "False | \n", "False | \n", "{GO:0051234, GO:0006810, BFO:0000015, GO:00156... | \n", "{GO:0051234, GO:0006810, BFO:0000015, GO:00511... | \n", "NAS | \n", "... | \n", "[PMID:10072596] | \n", "2020-01-01 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "True | \n", "True | \n", "True | \n", "False | \n", "False | \n", "
425053 | \n", "UniProtKB:Q9Y267 | \n", "SLC22A14 | \n", "None | \n", "GO:0005887 | \n", "None | \n", "True | \n", "False | \n", "{GO:0005887} | \n", "{} | \n", "NAS | \n", "... | \n", "[PMID:10072596] | \n", "2020-01-01 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "True | \n", "True | \n", "True | \n", "False | \n", "False | \n", "
425054 | \n", "UniProtKB:Q9Y267 | \n", "SLC22A14 | \n", "None | \n", "GO:0015101 | \n", "organic cation transmembrane transporter activity | \n", "False | \n", "False | \n", "{GO:0051234, GO:0055085, GO:0006810, BFO:00000... | \n", "{GO:0051234, GO:0055085, GO:0006810, BFO:00000... | \n", "NAS | \n", "... | \n", "[PMID:10072596] | \n", "2020-01-01 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "True | \n", "True | \n", "True | \n", "False | \n", "False | \n", "
425055 | \n", "UniProtKB:Q9Y267 | \n", "SLC22A14 | \n", "None | \n", "GO:0015695 | \n", "organic cation transport | \n", "False | \n", "False | \n", "{GO:0051234, GO:0006810, BFO:0000015, GO:00156... | \n", "{GO:0051234, GO:0006810, BFO:0000015, GO:00511... | \n", "NAS | \n", "... | \n", "[PMID:10072596] | \n", "2020-01-01 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "True | \n", "True | \n", "True | \n", "False | \n", "False | \n", "
432681 | \n", "UniProtKB:Q9Y5M6 | \n", "OCLM | \n", "None | \n", "GO:0007601 | \n", "visual perception | \n", "False | \n", "False | \n", "{GO:0032501, GO:0050953, GO:0003008, BFO:00000... | \n", "{GO:0032501, GO:0050953, GO:0003008, BFO:00000... | \n", "TAS | \n", "... | \n", "[PMID:10362512] | \n", "2020-01-01 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "True | \n", "True | \n", "True | \n", "False | \n", "False | \n", "
83 rows × 23 columns
\n", "\n", " | subject | \n", "subject_label | \n", "predicate | \n", "object | \n", "object_label | \n", "object_obsoletes | \n", "object_uninformative | \n", "object_closure | \n", "object_closure_redundant | \n", "evidence | \n", "... | \n", "pubs | \n", "release | \n", "pmid_new | \n", "is_new | \n", "fresh | \n", "pmid_removed | \n", "unique | \n", "redacted | \n", "redundant | \n", "iba_rejected | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
718564 | \n", "UniProtKB:Q06418 | \n", "TYRO3 | \n", "enables | \n", "GO:0004714 | \n", "transmembrane receptor protein tyrosine kinase... | \n", "False | \n", "False | \n", "{GO:0019199, GO:0140096, GO:0003824, GO:001674... | \n", "{GO:0019199, GO:0003824, BFO:0000015, GO:00167... | \n", "IBA | \n", "... | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "False | \n", "False | \n", "False | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "False | \n", "
718565 | \n", "UniProtKB:P78559 | \n", "MAP1A | \n", "is_active_in | \n", "GO:0030425 | \n", "dendrite | \n", "False | \n", "False | \n", "{GO:0030425, GO:0120025, GO:0043005, GO:011016... | \n", "{CARO:0030000, CL:0002319, CL:0000211, UBERON:... | \n", "IBA | \n", "... | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "False | \n", "False | \n", "False | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "False | \n", "
718566 | \n", "UniProtKB:Q7L1W4 | \n", "LRRC8D | \n", "is_active_in | \n", "GO:0005737 | \n", "cytoplasm | \n", "False | \n", "False | \n", "{CARO:0030000, UBERON:0000061, CARO:0000003, G... | \n", "{CARO:0030000, UBERON:0000061, CARO:0000003, C... | \n", "IBA | \n", "... | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "False | \n", "False | \n", "False | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "False | \n", "
718567 | \n", "UniProtKB:A3QJZ7 | \n", "PRAMEF27 | \n", "part_of | \n", "GO:0031462 | \n", "Cul2-RING ubiquitin ligase complex | \n", "False | \n", "False | \n", "{GO:0031462, GO:0031461, GO:1990234, BFO:00000... | \n", "{GO:0031461, GO:1990234, BFO:0000004, GO:01405... | \n", "IBA | \n", "... | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "False | \n", "True | \n", "False | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "False | \n", "
718568 | \n", "UniProtKB:Q70IA6 | \n", "MOB2 | \n", "is_active_in | \n", "GO:0005634 | \n", "nucleus | \n", "False | \n", "False | \n", "{GO:0110165, GO:0043231, BFO:0000002, GO:00432... | \n", "{CARO:0030000, CARO:0000000, BFO:0000004, GO:0... | \n", "IBA | \n", "... | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "False | \n", "False | \n", "False | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "False | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
782818 | \n", "UniProtKB:Q9NZC2 | \n", "TREM2 | \n", "involved_in | \n", "GO:0045088 | \n", "regulation of innate immune response | \n", "False | \n", "False | \n", "{GO:0065007, GO:0002682, GO:0050776, BFO:00000... | \n", "{GO:0065007, GO:0002682, GO:0050776, BFO:00000... | \n", "IBA | \n", "... | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "False | \n", "False | \n", "False | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "False | \n", "
782819 | \n", "UniProtKB:Q9Y2K2 | \n", "SIK3 | \n", "enables | \n", "GO:0050321 | \n", "tau-protein kinase activity | \n", "False | \n", "False | \n", "{GO:0140096, GO:0003824, GO:0004674, GO:001674... | \n", "{GO:0140096, GO:0003824, GO:0004674, GO:001674... | \n", "IBA | \n", "... | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "False | \n", "False | \n", "False | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "False | \n", "
782820 | \n", "UniProtKB:P43235 | \n", "CTSK | \n", "involved_in | \n", "GO:0051603 | \n", "proteolysis involved in protein catabolic process | \n", "False | \n", "False | \n", "{GO:0043170, GO:0006508, GO:0044238, GO:000905... | \n", "{GO:0043170, GO:0006508, GO:0044238, GO:000905... | \n", "IBA | \n", "... | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "False | \n", "False | \n", "False | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "False | \n", "
782821 | \n", "UniProtKB:Q07343 | \n", "PDE4B | \n", "enables | \n", "GO:0047555 | \n", "3',5'-cyclic-GMP phosphodiesterase activity | \n", "False | \n", "False | \n", "{GO:0047555, GO:0003824, GO:0008081, BFO:00000... | \n", "{GO:0003824, GO:0008081, BFO:0000015, GO:00425... | \n", "IBA | \n", "... | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "False | \n", "False | \n", "False | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "False | \n", "
782822 | \n", "UniProtKB:A6NC42 | \n", "DPPA5 | \n", "involved_in | \n", "GO:0010468 | \n", "regulation of gene expression | \n", "False | \n", "False | \n", "{GO:0065007, GO:0060255, GO:0009889, BFO:00000... | \n", "{GO:0065007, GO:0060255, GO:0009889, BFO:00000... | \n", "IBA | \n", "... | \n", "[GO_REF:0000033] | \n", "2024-11-03 | \n", "False | \n", "False | \n", "False | \n", "NaN | \n", "NaN | \n", "NaN | \n", "False | \n", "False | \n", "
56487 rows × 23 columns
\n", "