"""
Ensembl REST API Tool
This tool provides access to the Ensembl genome browser database for gene
lookup, sequence retrieval, variant information, and homology data.
"""
import requests
from typing import Dict, Any, Optional
from .base_tool import BaseTool
from .tool_registry import register_tool
[docs]
@register_tool("EnsemblLookupGene")
class EnsemblLookupGene(EnsemblRESTTool):
"""Lookup gene information by ID or symbol."""
[docs]
def __init__(self, tool_config):
super().__init__(tool_config)
self.endpoint = "/lookup/id"
[docs]
def run(self, arguments: Dict[str, Any]) -> Dict[str, Any]:
"""Lookup gene by ID or symbol."""
gene_id = arguments.get("gene_id", "")
if not gene_id:
return {"status": "error", "error": "gene_id is required"}
# Ensembl API requires the ID in the URL path
endpoint = f"{self.endpoint}/{gene_id}"
params = {"expand": 1}
# Add species if specified
if "species" in arguments:
params["species"] = arguments["species"]
result = self._make_request(endpoint, params)
# Add gene_id to result for reference
if result.get("status") == "success":
result["gene_id"] = gene_id
return result
[docs]
@register_tool("EnsemblGetSequence")
class EnsemblGetSequence(EnsemblRESTTool):
"""Get DNA or protein sequences by region or gene ID."""
[docs]
def __init__(self, tool_config):
super().__init__(tool_config)
self.endpoint = "/sequence/id"
[docs]
def run(self, arguments: Dict[str, Any]) -> Dict[str, Any]:
"""Get sequence by gene ID or region."""
sequence_id = arguments.get("sequence_id", "")
if not sequence_id:
return {"status": "error", "error": "sequence_id is required"}
# Ensembl API requires the ID in the URL path
endpoint = f"{self.endpoint}/{sequence_id}"
params = {
"type": arguments.get("type", "genomic"), # genomic, cds, protein
"multiple_sequences": "true",
}
# Add species if specified
if "species" in arguments:
params["species"] = arguments["species"]
result = self._make_request(endpoint, params)
# Add sequence_id to result for reference
if result.get("status") == "success":
result["sequence_id"] = sequence_id
return result
[docs]
@register_tool("EnsemblGetVariants")
class EnsemblGetVariants(EnsemblRESTTool):
"""Get variant information for a genomic region."""
[docs]
def __init__(self, tool_config):
super().__init__(tool_config)
self.endpoint = "/overlap/id"
[docs]
def run(self, arguments: Dict[str, Any]) -> Dict[str, Any]:
"""Get variants for a region."""
region = arguments.get("region", "")
if not region:
return {
"status": "error",
"error": "region is required (e.g., '1:1000000..2000000')",
}
# Ensembl API requires the region in the URL path with species
species = arguments.get("species", "human")
endpoint = f"/overlap/region/{species}/{region}"
params = {"feature": "variation", "content-type": "application/json"}
result = self._make_request(endpoint, params)
# Add region to result for reference
if result.get("status") == "success":
result["region"] = region
return result