Query ClinVar for clinical variant significance. Use when user asks about variant pathogenicity, genetic variants, clinical significance, or disease-causing mutations. Triggers on "clinvar", "pathogenic", "variant significance", "clinical significance", "disease variant", "mutation pathogenicity".
Query NCBI ClinVar for clinical significance of genetic variants.
from Bio import Entrez
import json
Entrez.email = "[email protected]"
# 1. Search ClinVar
def search_clinvar(query, max_results=10):
handle = Entrez.esearch(db="clinvar", term=query, retmax=max_results)
record = Entrez.read(handle)
handle.close()
return record
# 2. Fetch variant details
def fetch_clinvar(id_list):
ids = ",".join(str(i) for i in id_list)
handle = Entrez.efetch(db="clinvar", id=ids, rettype="vcv", retmode="xml")
result = handle.read()
handle.close()
return result
# 3. Summary for ClinVar IDs
def clinvar_summary(id_list):
ids = ",".join(str(i) for i in id_list)
handle = Entrez.esummary(db="clinvar", id=ids, retmode="json")
result = json.loads(handle.read())
handle.close()
return result
# Example: Find pathogenic BRCA1 variants
search = search_clinvar("BRCA1[gene] AND clinsig_pathogenic[prop]", max_results=5)
print(f"Total pathogenic BRCA1 variants: {search['Count']}")
if search['IdList']:
summaries = clinvar_summary(search['IdList'])
for uid in search['IdList']:
info = summaries['result'].get(str(uid), {})
title = info.get('title', 'N/A')
clinical_sig = info.get('clinical_significance', {}).get('description', 'N/A')
genes = info.get('genes', [{}])
gene = genes[0].get('symbol', 'N/A') if genes else 'N/A'
print(f"\nVariant: {title}")
print(f"Gene: {gene}")
print(f"Clinical significance: {clinical_sig}")
BRCA1[gene] AND clinsig_pathogenic[prop]rs6025[rsid]"breast cancer"[dis] AND clinsig_pathogenic[prop]17[chr] AND 43000000:44000000[chrpos37]BRCA1[gene] AND origin_germline[prop]