diff --git a/data-exploration/direction-of-effect.ipynb b/data-exploration/direction-of-effect.ipynb
index f4705e8..70525d8 100644
--- a/data-exploration/direction-of-effect.ipynb
+++ b/data-exploration/direction-of-effect.ipynb
@@ -207,7 +207,7 @@
},
{
"cell_type": "code",
- "execution_count": null,
+ "execution_count": 245,
"id": "d22115ea-56f6-404d-9839-c91c8ed74a89",
"metadata": {
"pycharm": {
@@ -215,134 +215,6 @@
},
"scrolled": true
},
- "outputs": [],
- "source": [
- "# Looking at the data - output suppressed for brevity\n",
- "var_drug_ann.head()"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "12dada29-2a14-4992-acf4-45115aed57d2",
- "metadata": {
- "pycharm": {
- "name": "#%%\n"
- },
- "scrolled": true
- },
- "outputs": [],
- "source": [
- "var_fa_ann.head()"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "70537798-e6fb-47f5-8ba2-6859c4b645a2",
- "metadata": {
- "scrolled": true
- },
- "outputs": [],
- "source": [
- "var_pheno_ann.head()"
- ]
- },
- {
- "cell_type": "markdown",
- "id": "3b84a02e-1791-4a6b-8223-d904442ddf7c",
- "metadata": {},
- "source": [
- "The 3 annotations tables provide evidence for the clinical annotations, can be connected by joining with the `clinical_ann_evidence.tsv` file. In general a clinical annotation can have multiple variant annotations as evidence, and a variant annotation can be used as evidence for multiple clinical annotations (in theory, I've not actually observed this).\n",
- "\n",
- "Each of these tables has a \"Direction of effect\" column, and the type of \"effect\" is different for each - likelihood of side effects, formation of product, metabolism of drug, etc.\n",
- "\n",
- "**Question for OT**: when we say \"direction of effect\", do we mean any of these \"effects\"? I.e. should we include all three of these tables or focus on one?"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 38,
- "id": "d43fd147-43b4-4541-9595-f757da937e60",
- "metadata": {},
- "outputs": [],
- "source": [
- "clinical_annotations = read_tsv_to_df(os.path.join(data_dir, 'clinical_annotations.tsv'))\n",
- "clinical_ann_evidence = read_tsv_to_df(os.path.join(data_dir, 'clinical_ann_evidence.tsv'))\n",
- "clinical_ann_alleles = read_tsv_to_df(os.path.join(data_dir, 'clinical_ann_alleles.tsv'))"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 122,
- "id": "1a553aac-a9f7-4579-ab7c-05fa6f90ddfe",
- "metadata": {},
- "outputs": [],
- "source": [
- "main_df = pd.merge(clinical_annotations, clinical_ann_evidence, how='left', on=ID_COL_NAME)\n",
- "main_df = main_df[[\n",
- " # Main table\n",
- " 'Clinical Annotation ID', 'Variant/Haplotypes', 'Gene', 'Level of Evidence', 'Phenotype Category', 'Drug(s)', 'Phenotype(s)',\n",
- " # Evidence table\n",
- " 'Evidence ID', 'Evidence Type', 'PMID', 'Summary',\n",
- "]]"
- ]
- },
- {
- "cell_type": "markdown",
- "id": "5945f09b-9516-4d65-ad75-d27a5a1890cf",
- "metadata": {},
- "source": [
- "#### Example clinical annotation\n",
- "\n",
- "[Top of page](#Table-of-contents)\n",
- "\n",
- "Looking at [981755803](https://www.pharmgkb.org/clinicalAnnotation/981755803), which has all three types of variant annotation evidence as well as label/guideline evidence."
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 124,
- "id": "f5bb8c9e-baeb-4ef6-9373-7c38a333601c",
- "metadata": {},
- "outputs": [],
- "source": [
- "df_981755803 = main_df[main_df[ID_COL_NAME] == '981755803']\n",
- "\n",
- "df_981755803_drug = pd.merge(df_981755803, var_drug_ann, left_on='Evidence ID', right_on='Variant Annotation ID', how='inner', suffixes=(None, '_var_drug'))\n",
- "df_981755803_pheno = pd.merge(df_981755803, var_pheno_ann, left_on='Evidence ID', right_on='Variant Annotation ID', how='inner', suffixes=(None, '_var_pheno'))\n",
- "df_981755803_fa = pd.merge(df_981755803, var_fa_ann, left_on='Evidence ID', right_on='Variant Annotation ID', how='inner', suffixes=(None, '_var_fa'))"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 229,
- "id": "811adf62-6f79-4451-9a3e-2772057e4a01",
- "metadata": {},
- "outputs": [
- {
- "name": "stdout",
- "output_type": "stream",
- "text": [
- "Number of evidence 30\n",
- "Number of var/drug evidence 24\n",
- "Number of var/fa evidence 2\n",
- "Number of var/pheno evidence 2\n"
- ]
- }
- ],
- "source": [
- "print('Number of evidence', len(df_981755803))\n",
- "print('Number of var/drug evidence', len(df_981755803_drug))\n",
- "print('Number of var/fa evidence', len(df_981755803_fa))\n",
- "print('Number of var/pheno evidence', len(df_981755803_pheno))"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 206,
- "id": "c4a15bc6-90fc-4d4b-bd0e-621b8ffd6093",
- "metadata": {},
"outputs": [
{
"data": {
@@ -365,23 +237,12 @@
" \n",
" \n",
" | \n",
- " Clinical Annotation ID | \n",
+ " Variant Annotation ID | \n",
" Variant/Haplotypes | \n",
" Gene | \n",
- " Level of Evidence | \n",
- " Phenotype Category | \n",
" Drug(s) | \n",
- " Phenotype(s) | \n",
- " Evidence ID | \n",
- " Evidence Type | \n",
" PMID | \n",
- " Summary | \n",
- " Variant Annotation ID | \n",
- " Variant/Haplotypes_var_drug | \n",
- " Gene_var_drug | \n",
- " Drug(s)_var_drug | \n",
- " PMID_var_drug | \n",
- " Phenotype Category_var_drug | \n",
+ " Phenotype Category | \n",
" Significance | \n",
" Notes | \n",
" Sentence | \n",
@@ -399,10 +260,1514 @@
" Comparison Allele(s) or Genotype(s) | \n",
" Comparison Metabolizer types | \n",
"
\n",
- " \n",
- "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " 1451834452 | \n",
+ " CYP3A4*1, CYP3A4*17 | \n",
+ " CYP3A4 | \n",
+ " nifedipine | \n",
+ " 15634941 | \n",
+ " Other, Metabolism/PK | \n",
+ " not stated | \n",
+ " in vitro expression of the recombinant CYP3A4*17 allelic protein and the wild-type protein | \n",
+ " CYP3A4 *17 is associated with decreased metabolism of nifedipine as compared to CYP3A4 *1. | \n",
+ " *17 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " decreased | \n",
+ " metabolism of | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " *1 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " 1451159680 | \n",
+ " rs5031016 | \n",
+ " CYP2A6 | \n",
+ " warfarin | \n",
+ " 22248286 | \n",
+ " Dosage | \n",
+ " no | \n",
+ " No association was found between this variant and warfarin-maintenance dose. Described as CYP2A6*7 in this study. | \n",
+ " Allele G is not associated with increased dose of warfarin in people with an international normalized ratio (INR) of 2.0-3.0 as compared to allele A. | \n",
+ " G | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Not associated with | \n",
+ " increased | \n",
+ " dose of | \n",
+ " NaN | \n",
+ " in people with | \n",
+ " Other:an international normalized ratio (INR) of 2.0-3.0 | \n",
+ " NaN | \n",
+ " A | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " 1451306860 | \n",
+ " CYP2C9*11 | \n",
+ " CYP2C9 | \n",
+ " warfarin | \n",
+ " 33350885 | \n",
+ " Dosage | \n",
+ " not stated | \n",
+ " \"This case suggests that CYP2C9 *11/*11 carriers require approximately two thirds less warfarin than CYP2C9\" normal function homozygotes. | \n",
+ " CYP2C9 *11/*11 is associated with decreased dose of warfarin. | \n",
+ " *11/*11 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " decreased | \n",
+ " dose of | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " 1448997750 | \n",
+ " CYP2B6*1, CYP2B6*18 | \n",
+ " CYP2B6 | \n",
+ " efavirenz | \n",
+ " 16495778 | \n",
+ " Metabolism/PK | \n",
+ " yes | \n",
+ " Please note that in the paper the allele was referred to as CYP2B6*16. CYP2B6*16 and *18 alleles have been consolidated by PharmVar in Jan 2020, with *16 now listed as a suballele of *18 (CYP2B6*18.002). This annotation is updated to be on CYP2B6*18, instead of CYP2B6*16. | \n",
+ " CYP2B6 *1/*18 is associated with increased concentrations of efavirenz in people with HIV Infections as compared to CYP2B6 *1/*1. | \n",
+ " *1/*18 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " increased | \n",
+ " concentrations of | \n",
+ " NaN | \n",
+ " in people with | \n",
+ " Disease:HIV Infections | \n",
+ " NaN | \n",
+ " *1/*1 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " 1448631821 | \n",
+ " CYP2C19*1, CYP2C19*2 | \n",
+ " CYP2C19 | \n",
+ " clomipramine, desmethyl clomipramine | \n",
+ " 28470111 | \n",
+ " Metabolism/PK | \n",
+ " no | \n",
+ " in a single individual | \n",
+ " CYP2C19 *1/*2 is associated with increased trough concentration of clomipramine and desmethyl clomipramine. | \n",
+ " *1/*2 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " increased | \n",
+ " trough concentration of | \n",
+ " and | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ "\n",
+ ""
+ ],
+ "text/plain": [
+ " Variant Annotation ID Variant/Haplotypes Gene \\\n",
+ "0 1451834452 CYP3A4*1, CYP3A4*17 CYP3A4 \n",
+ "1 1451159680 rs5031016 CYP2A6 \n",
+ "2 1451306860 CYP2C9*11 CYP2C9 \n",
+ "3 1448997750 CYP2B6*1, CYP2B6*18 CYP2B6 \n",
+ "4 1448631821 CYP2C19*1, CYP2C19*2 CYP2C19 \n",
+ "\n",
+ " Drug(s) PMID Phenotype Category \\\n",
+ "0 nifedipine 15634941 Other, Metabolism/PK \n",
+ "1 warfarin 22248286 Dosage \n",
+ "2 warfarin 33350885 Dosage \n",
+ "3 efavirenz 16495778 Metabolism/PK \n",
+ "4 clomipramine, desmethyl clomipramine 28470111 Metabolism/PK \n",
+ "\n",
+ " Significance \\\n",
+ "0 not stated \n",
+ "1 no \n",
+ "2 not stated \n",
+ "3 yes \n",
+ "4 no \n",
+ "\n",
+ " Notes \\\n",
+ "0 in vitro expression of the recombinant CYP3A4*17 allelic protein and the wild-type protein \n",
+ "1 No association was found between this variant and warfarin-maintenance dose. Described as CYP2A6*7 in this study. \n",
+ "2 \"This case suggests that CYP2C9 *11/*11 carriers require approximately two thirds less warfarin than CYP2C9\" normal function homozygotes. \n",
+ "3 Please note that in the paper the allele was referred to as CYP2B6*16. CYP2B6*16 and *18 alleles have been consolidated by PharmVar in Jan 2020, with *16 now listed as a suballele of *18 (CYP2B6*18.002). This annotation is updated to be on CYP2B6*18, instead of CYP2B6*16. \n",
+ "4 in a single individual \n",
+ "\n",
+ " Sentence \\\n",
+ "0 CYP3A4 *17 is associated with decreased metabolism of nifedipine as compared to CYP3A4 *1. \n",
+ "1 Allele G is not associated with increased dose of warfarin in people with an international normalized ratio (INR) of 2.0-3.0 as compared to allele A. \n",
+ "2 CYP2C9 *11/*11 is associated with decreased dose of warfarin. \n",
+ "3 CYP2B6 *1/*18 is associated with increased concentrations of efavirenz in people with HIV Infections as compared to CYP2B6 *1/*1. \n",
+ "4 CYP2C19 *1/*2 is associated with increased trough concentration of clomipramine and desmethyl clomipramine. \n",
+ "\n",
+ " Alleles Specialty Population Metabolizer types isPlural \\\n",
+ "0 *17 NaN NaN Is \n",
+ "1 G NaN NaN Is \n",
+ "2 *11/*11 NaN NaN Is \n",
+ "3 *1/*18 NaN NaN Is \n",
+ "4 *1/*2 NaN NaN Is \n",
+ "\n",
+ " Is/Is Not associated Direction of effect PD/PK terms \\\n",
+ "0 Associated with decreased metabolism of \n",
+ "1 Not associated with increased dose of \n",
+ "2 Associated with decreased dose of \n",
+ "3 Associated with increased concentrations of \n",
+ "4 Associated with increased trough concentration of \n",
+ "\n",
+ " Multiple drugs And/or Population types \\\n",
+ "0 NaN NaN \n",
+ "1 NaN in people with \n",
+ "2 NaN NaN \n",
+ "3 NaN in people with \n",
+ "4 and NaN \n",
+ "\n",
+ " Population Phenotypes or diseases \\\n",
+ "0 NaN \n",
+ "1 Other:an international normalized ratio (INR) of 2.0-3.0 \n",
+ "2 NaN \n",
+ "3 Disease:HIV Infections \n",
+ "4 NaN \n",
+ "\n",
+ " Multiple phenotypes or diseases And/or Comparison Allele(s) or Genotype(s) \\\n",
+ "0 NaN *1 \n",
+ "1 NaN A \n",
+ "2 NaN NaN \n",
+ "3 NaN *1/*1 \n",
+ "4 NaN NaN \n",
+ "\n",
+ " Comparison Metabolizer types \n",
+ "0 NaN \n",
+ "1 NaN \n",
+ "2 NaN \n",
+ "3 NaN \n",
+ "4 NaN "
+ ]
+ },
+ "execution_count": 245,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "# Looking at the data - first rows only, for brevity\n",
+ "var_drug_ann.head()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 246,
+ "id": "12dada29-2a14-4992-acf4-45115aed57d2",
+ "metadata": {
+ "pycharm": {
+ "name": "#%%\n"
+ },
+ "scrolled": true
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " Variant Annotation ID | \n",
+ " Variant/Haplotypes | \n",
+ " Gene | \n",
+ " Drug(s) | \n",
+ " PMID | \n",
+ " Phenotype Category | \n",
+ " Significance | \n",
+ " Notes | \n",
+ " Sentence | \n",
+ " Alleles | \n",
+ " Specialty Population | \n",
+ " Assay type | \n",
+ " Metabolizer types | \n",
+ " isPlural | \n",
+ " Is/Is Not associated | \n",
+ " Direction of effect | \n",
+ " Functional terms | \n",
+ " Gene/gene product | \n",
+ " When treated with/exposed to/when assayed with | \n",
+ " Multiple drugs And/or | \n",
+ " Cell type | \n",
+ " Comparison Allele(s) or Genotype(s) | \n",
+ " Comparison Metabolizer types | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " 1451148445 | \n",
+ " CYP2C19*1, CYP2C19*17 | \n",
+ " CYP2C19 | \n",
+ " normeperidine | \n",
+ " 30902024 | \n",
+ " NaN | \n",
+ " not stated | \n",
+ " In other in vitro experiments, normeperidine formation was significantly correlated with CYP2C19 activity, as measured by S-mephenytoin 4-hydroxylation. | \n",
+ " CYP2C19 *17/*17 is associated with increased formation of normeperidine as compared to CYP2C19 *1/*1 + *1/*17. | \n",
+ " *17/*17 | \n",
+ " NaN | \n",
+ " in human liver microsomes | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " increased | \n",
+ " formation of | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " *1/*1 + *1/*17 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " 1447814273 | \n",
+ " rs9923231 | \n",
+ " VKORC1 | \n",
+ " NaN | \n",
+ " 26847243 | \n",
+ " Other | \n",
+ " no | \n",
+ " NaN | \n",
+ " Allele T is not associated with transcription of VKORC1 in HepG2 cells as compared to allele C. | \n",
+ " T | \n",
+ " NaN | \n",
+ " luciferase assay | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Not associated with | \n",
+ " NaN | \n",
+ " transcription of | \n",
+ " VKORC1 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " in HepG2 cells | \n",
+ " C | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " 1447814277 | \n",
+ " rs56314408 | \n",
+ " VKORC1 | \n",
+ " NaN | \n",
+ " 26847243 | \n",
+ " Other | \n",
+ " yes | \n",
+ " In the European population, this SNPs is in high LD with rs9923231 but not other populations. This SNP disrupts a binding motif for transcription factor TFAP2A/C. | \n",
+ " Allele C is associated with increased transcription of VKORC1 in HepG2 cells as compared to allele T. | \n",
+ " C | \n",
+ " NaN | \n",
+ " luciferase assay | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " increased | \n",
+ " transcription of | \n",
+ " VKORC1 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " in HepG2 cells | \n",
+ " T | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " 1447990384 | \n",
+ " rs1065852 | \n",
+ " CYP2D6 | \n",
+ " bufuralol | \n",
+ " 2211621 | \n",
+ " Metabolism/PK | \n",
+ " not stated | \n",
+ " In vitro experiments showed a significant decrease in CYP2D6 activity for the variant construct expressed in COS-1 cells as compared to wild-type. | \n",
+ " Allele A is associated with decreased activity of CYP2D6 when assayed with bufuralol in COS-1 cells as compared to allele G. | \n",
+ " A | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " decreased | \n",
+ " activity of | \n",
+ " CYP2D6 | \n",
+ " when assayed with | \n",
+ " NaN | \n",
+ " in COS-1 cells | \n",
+ " G | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " 1448281185 | \n",
+ " CYP2B6*1, CYP2B6*6 | \n",
+ " CYP2B6 | \n",
+ " bupropion | \n",
+ " 27439448 | \n",
+ " Efficacy | \n",
+ " yes | \n",
+ " The ratio of hydroxybupropion versus bupropion (AUC_hyd/ AUC_bup) in terms of area under the time-concentration curve (AUC) was used to assay CYP2B6 activity. | \n",
+ " CYP2B6 *1/*1 is associated with increased activity of CYP2B6 when assayed with bupropion as compared to CYP2B6 *1/*6. | \n",
+ " *1/*1 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " increased | \n",
+ " activity of | \n",
+ " CYP2B6 | \n",
+ " when assayed with | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " *1/*6 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ " Variant Annotation ID Variant/Haplotypes Gene Drug(s) \\\n",
+ "0 1451148445 CYP2C19*1, CYP2C19*17 CYP2C19 normeperidine \n",
+ "1 1447814273 rs9923231 VKORC1 NaN \n",
+ "2 1447814277 rs56314408 VKORC1 NaN \n",
+ "3 1447990384 rs1065852 CYP2D6 bufuralol \n",
+ "4 1448281185 CYP2B6*1, CYP2B6*6 CYP2B6 bupropion \n",
+ "\n",
+ " PMID Phenotype Category Significance \\\n",
+ "0 30902024 NaN not stated \n",
+ "1 26847243 Other no \n",
+ "2 26847243 Other yes \n",
+ "3 2211621 Metabolism/PK not stated \n",
+ "4 27439448 Efficacy yes \n",
+ "\n",
+ " Notes \\\n",
+ "0 In other in vitro experiments, normeperidine formation was significantly correlated with CYP2C19 activity, as measured by S-mephenytoin 4-hydroxylation. \n",
+ "1 NaN \n",
+ "2 In the European population, this SNPs is in high LD with rs9923231 but not other populations. This SNP disrupts a binding motif for transcription factor TFAP2A/C. \n",
+ "3 In vitro experiments showed a significant decrease in CYP2D6 activity for the variant construct expressed in COS-1 cells as compared to wild-type. \n",
+ "4 The ratio of hydroxybupropion versus bupropion (AUC_hyd/ AUC_bup) in terms of area under the time-concentration curve (AUC) was used to assay CYP2B6 activity. \n",
+ "\n",
+ " Sentence \\\n",
+ "0 CYP2C19 *17/*17 is associated with increased formation of normeperidine as compared to CYP2C19 *1/*1 + *1/*17. \n",
+ "1 Allele T is not associated with transcription of VKORC1 in HepG2 cells as compared to allele C. \n",
+ "2 Allele C is associated with increased transcription of VKORC1 in HepG2 cells as compared to allele T. \n",
+ "3 Allele A is associated with decreased activity of CYP2D6 when assayed with bufuralol in COS-1 cells as compared to allele G. \n",
+ "4 CYP2B6 *1/*1 is associated with increased activity of CYP2B6 when assayed with bupropion as compared to CYP2B6 *1/*6. \n",
+ "\n",
+ " Alleles Specialty Population Assay type Metabolizer types \\\n",
+ "0 *17/*17 NaN in human liver microsomes NaN \n",
+ "1 T NaN luciferase assay NaN \n",
+ "2 C NaN luciferase assay NaN \n",
+ "3 A NaN NaN NaN \n",
+ "4 *1/*1 NaN NaN NaN \n",
+ "\n",
+ " isPlural Is/Is Not associated Direction of effect Functional terms \\\n",
+ "0 Is Associated with increased formation of \n",
+ "1 Is Not associated with NaN transcription of \n",
+ "2 Is Associated with increased transcription of \n",
+ "3 Is Associated with decreased activity of \n",
+ "4 Is Associated with increased activity of \n",
+ "\n",
+ " Gene/gene product When treated with/exposed to/when assayed with \\\n",
+ "0 NaN NaN \n",
+ "1 VKORC1 NaN \n",
+ "2 VKORC1 NaN \n",
+ "3 CYP2D6 when assayed with \n",
+ "4 CYP2B6 when assayed with \n",
+ "\n",
+ " Multiple drugs And/or Cell type Comparison Allele(s) or Genotype(s) \\\n",
+ "0 NaN NaN *1/*1 + *1/*17 \n",
+ "1 NaN in HepG2 cells C \n",
+ "2 NaN in HepG2 cells T \n",
+ "3 NaN in COS-1 cells G \n",
+ "4 NaN NaN *1/*6 \n",
+ "\n",
+ " Comparison Metabolizer types \n",
+ "0 NaN \n",
+ "1 NaN \n",
+ "2 NaN \n",
+ "3 NaN \n",
+ "4 NaN "
+ ]
+ },
+ "execution_count": 246,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "var_fa_ann.head()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 247,
+ "id": "70537798-e6fb-47f5-8ba2-6859c4b645a2",
+ "metadata": {
+ "scrolled": true
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " Variant Annotation ID | \n",
+ " Variant/Haplotypes | \n",
+ " Gene | \n",
+ " Drug(s) | \n",
+ " PMID | \n",
+ " Phenotype Category | \n",
+ " Significance | \n",
+ " Notes | \n",
+ " Sentence | \n",
+ " Alleles | \n",
+ " Specialty Population | \n",
+ " Metabolizer types | \n",
+ " isPlural | \n",
+ " Is/Is Not associated | \n",
+ " Direction of effect | \n",
+ " Side effect/efficacy/other | \n",
+ " Phenotype | \n",
+ " Multiple phenotypes And/or | \n",
+ " When treated with/exposed to/when assayed with | \n",
+ " Multiple drugs And/or | \n",
+ " Population types | \n",
+ " Population Phenotypes or diseases | \n",
+ " Multiple phenotypes or diseases And/or | \n",
+ " Comparison Allele(s) or Genotype(s) | \n",
+ " Comparison Metabolizer types | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " 1449169911 | \n",
+ " HLA-B*35:08 | \n",
+ " HLA-B | \n",
+ " lamotrigine | \n",
+ " 29238301 | \n",
+ " Toxicity | \n",
+ " no | \n",
+ " The allele was not significant when comparing allele frequency in cases of severe cutaneous adverse reactions (SCAR), Stevens-Johnson Syndrome (SJS) and Maculopapular Exanthema (MPE) (1/15) and controls (individuals without AEs who took lamotrigine) (0/50). The allele was significant when comparing between cases (1/15) and the general population (1/986). | \n",
+ " HLA-B *35:08 is not associated with likelihood of Maculopapular Exanthema, severe cutaneous adverse reactions or Stevens-Johnson Syndrome when treated with lamotrigine in people with Epilepsy. | \n",
+ " *35:08 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Not associated with | \n",
+ " NaN | \n",
+ " likelihood of | \n",
+ " Side Effect:Maculopapular Exanthema, Side Effect:severe cutaneous adverse reactions, Side Effect:Stevens-Johnson Syndrome | \n",
+ " or | \n",
+ " when treated with | \n",
+ " NaN | \n",
+ " in people with | \n",
+ " Disease:Epilepsy | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " 982022165 | \n",
+ " rs45607939 | \n",
+ " NAT2 | \n",
+ " sulfamethoxazole / trimethoprim | \n",
+ " 22850190 | \n",
+ " Toxicity | \n",
+ " no | \n",
+ " Minor allele frequencies were compared between cases (with drug-induced hypersensitivity) and controls. | \n",
+ " Allele T is not associated with increased risk of Hypersensitivity when treated with sulfamethoxazole / trimethoprim in people with Infection. | \n",
+ " T | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Not associated with | \n",
+ " increased | \n",
+ " risk of | \n",
+ " Disease:Hypersensitivity | \n",
+ " NaN | \n",
+ " when treated with | \n",
+ " NaN | \n",
+ " in people with | \n",
+ " Disease:Infection | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " 982022148 | \n",
+ " rs1799930 | \n",
+ " NAT2 | \n",
+ " sulfamethoxazole / trimethoprim | \n",
+ " 22850190 | \n",
+ " Toxicity | \n",
+ " no | \n",
+ " Minor allele frequencies were compared between cases (with drug-induced hypersensitivity) and controls. | \n",
+ " Allele A is not associated with increased risk of Hypersensitivity when treated with sulfamethoxazole / trimethoprim in people with Infection. | \n",
+ " A | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Not associated with | \n",
+ " increased | \n",
+ " risk of | \n",
+ " Disease:Hypersensitivity | \n",
+ " NaN | \n",
+ " when treated with | \n",
+ " NaN | \n",
+ " in people with | \n",
+ " Disease:Infection | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " 1451283480 | \n",
+ " rs16969968 | \n",
+ " CHRNA5 | \n",
+ " NaN | \n",
+ " 22071378 | \n",
+ " Other | \n",
+ " yes | \n",
+ " this was from meta-analysis of 27 studies but the number of total cases and the risk allele not clearly specified. Minor allele frequency was given for A allele. Introduction states that variant is Asp398Asn, where Asn (A allele) has lower nicotine response than Asp (G allele) and may be at greater risk for nicotine addiction. | \n",
+ " Allele A is associated with increased severity of Tobacco Use Disorder in people with Tobacco Use Disorder. | \n",
+ " A | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " increased | \n",
+ " severity of | \n",
+ " Other:Tobacco Use Disorder | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " in people with | \n",
+ " Other:Tobacco Use Disorder | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " 1444696916 | \n",
+ " rs267606617 | \n",
+ " MT-RNR1 | \n",
+ " streptomycin | \n",
+ " 7689389 | \n",
+ " Toxicity | \n",
+ " not stated | \n",
+ " Pedigree analysis with 3 separate families. Within the maternal lines, 15 individuals had the 1555G variant, took aminoglycoside antibiotics, and developed hearing loss. 100% of individuals with the 1555G variant who took aminoglycosides developed hearing loss. Homoplasmic. Please note that no statistical analyses were done. | \n",
+ " Allele G is associated with Ototoxicity when treated with streptomycin as compared to allele A. | \n",
+ " G | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Side Effect:Ototoxicity | \n",
+ " and | \n",
+ " when treated with | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " A | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ " Variant Annotation ID Variant/Haplotypes Gene \\\n",
+ "0 1449169911 HLA-B*35:08 HLA-B \n",
+ "1 982022165 rs45607939 NAT2 \n",
+ "2 982022148 rs1799930 NAT2 \n",
+ "3 1451283480 rs16969968 CHRNA5 \n",
+ "4 1444696916 rs267606617 MT-RNR1 \n",
+ "\n",
+ " Drug(s) PMID Phenotype Category Significance \\\n",
+ "0 lamotrigine 29238301 Toxicity no \n",
+ "1 sulfamethoxazole / trimethoprim 22850190 Toxicity no \n",
+ "2 sulfamethoxazole / trimethoprim 22850190 Toxicity no \n",
+ "3 NaN 22071378 Other yes \n",
+ "4 streptomycin 7689389 Toxicity not stated \n",
+ "\n",
+ " Notes \\\n",
+ "0 The allele was not significant when comparing allele frequency in cases of severe cutaneous adverse reactions (SCAR), Stevens-Johnson Syndrome (SJS) and Maculopapular Exanthema (MPE) (1/15) and controls (individuals without AEs who took lamotrigine) (0/50). The allele was significant when comparing between cases (1/15) and the general population (1/986). \n",
+ "1 Minor allele frequencies were compared between cases (with drug-induced hypersensitivity) and controls. \n",
+ "2 Minor allele frequencies were compared between cases (with drug-induced hypersensitivity) and controls. \n",
+ "3 this was from meta-analysis of 27 studies but the number of total cases and the risk allele not clearly specified. Minor allele frequency was given for A allele. Introduction states that variant is Asp398Asn, where Asn (A allele) has lower nicotine response than Asp (G allele) and may be at greater risk for nicotine addiction. \n",
+ "4 Pedigree analysis with 3 separate families. Within the maternal lines, 15 individuals had the 1555G variant, took aminoglycoside antibiotics, and developed hearing loss. 100% of individuals with the 1555G variant who took aminoglycosides developed hearing loss. Homoplasmic. Please note that no statistical analyses were done. \n",
+ "\n",
+ " Sentence \\\n",
+ "0 HLA-B *35:08 is not associated with likelihood of Maculopapular Exanthema, severe cutaneous adverse reactions or Stevens-Johnson Syndrome when treated with lamotrigine in people with Epilepsy. \n",
+ "1 Allele T is not associated with increased risk of Hypersensitivity when treated with sulfamethoxazole / trimethoprim in people with Infection. \n",
+ "2 Allele A is not associated with increased risk of Hypersensitivity when treated with sulfamethoxazole / trimethoprim in people with Infection. \n",
+ "3 Allele A is associated with increased severity of Tobacco Use Disorder in people with Tobacco Use Disorder. \n",
+ "4 Allele G is associated with Ototoxicity when treated with streptomycin as compared to allele A. \n",
+ "\n",
+ " Alleles Specialty Population Metabolizer types isPlural \\\n",
+ "0 *35:08 NaN NaN Is \n",
+ "1 T NaN NaN Is \n",
+ "2 A NaN NaN Is \n",
+ "3 A NaN NaN Is \n",
+ "4 G NaN NaN Is \n",
+ "\n",
+ " Is/Is Not associated Direction of effect Side effect/efficacy/other \\\n",
+ "0 Not associated with NaN likelihood of \n",
+ "1 Not associated with increased risk of \n",
+ "2 Not associated with increased risk of \n",
+ "3 Associated with increased severity of \n",
+ "4 Associated with NaN NaN \n",
+ "\n",
+ " Phenotype \\\n",
+ "0 Side Effect:Maculopapular Exanthema, Side Effect:severe cutaneous adverse reactions, Side Effect:Stevens-Johnson Syndrome \n",
+ "1 Disease:Hypersensitivity \n",
+ "2 Disease:Hypersensitivity \n",
+ "3 Other:Tobacco Use Disorder \n",
+ "4 Side Effect:Ototoxicity \n",
+ "\n",
+ " Multiple phenotypes And/or When treated with/exposed to/when assayed with \\\n",
+ "0 or when treated with \n",
+ "1 NaN when treated with \n",
+ "2 NaN when treated with \n",
+ "3 NaN NaN \n",
+ "4 and when treated with \n",
+ "\n",
+ " Multiple drugs And/or Population types Population Phenotypes or diseases \\\n",
+ "0 NaN in people with Disease:Epilepsy \n",
+ "1 NaN in people with Disease:Infection \n",
+ "2 NaN in people with Disease:Infection \n",
+ "3 NaN in people with Other:Tobacco Use Disorder \n",
+ "4 NaN NaN NaN \n",
+ "\n",
+ " Multiple phenotypes or diseases And/or Comparison Allele(s) or Genotype(s) \\\n",
+ "0 NaN NaN \n",
+ "1 NaN NaN \n",
+ "2 NaN NaN \n",
+ "3 NaN NaN \n",
+ "4 NaN A \n",
+ "\n",
+ " Comparison Metabolizer types \n",
+ "0 NaN \n",
+ "1 NaN \n",
+ "2 NaN \n",
+ "3 NaN \n",
+ "4 NaN "
+ ]
+ },
+ "execution_count": 247,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "var_pheno_ann.head()"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "3b84a02e-1791-4a6b-8223-d904442ddf7c",
+ "metadata": {},
+ "source": [
+ "The 3 annotation tables provide evidence for the clinical annotations, and can be connected to them by joining with the `clinical_ann_evidence.tsv` file. In general, a clinical annotation can have multiple variant annotations as evidence, and a variant annotation can be used as evidence for multiple clinical annotations (in theory; I've not actually observed this).\n",
+ "\n",
+ "Each of these tables has a \"Direction of effect\" column, and the type of \"effect\" is different for each - likelihood of side effects, formation of product, metabolism of drug, etc.\n",
+ "\n",
+ "**Question for OT**: when we say \"direction of effect\", do we mean any of these \"effects\"? I.e. should we include all three of these tables or focus on one?"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 38,
+ "id": "d43fd147-43b4-4541-9595-f757da937e60",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "clinical_annotations = read_tsv_to_df(os.path.join(data_dir, 'clinical_annotations.tsv'))\n",
+ "clinical_ann_evidence = read_tsv_to_df(os.path.join(data_dir, 'clinical_ann_evidence.tsv'))\n",
+ "clinical_ann_alleles = read_tsv_to_df(os.path.join(data_dir, 'clinical_ann_alleles.tsv'))"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 122,
+ "id": "1a553aac-a9f7-4579-ab7c-05fa6f90ddfe",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "main_df = pd.merge(clinical_annotations, clinical_ann_evidence, how='left', on=ID_COL_NAME)\n",
+ "main_df = main_df[[\n",
+ " # Main table\n",
+ " 'Clinical Annotation ID', 'Variant/Haplotypes', 'Gene', 'Level of Evidence', 'Phenotype Category', 'Drug(s)', 'Phenotype(s)',\n",
+ " # Evidence table\n",
+ " 'Evidence ID', 'Evidence Type', 'PMID', 'Summary',\n",
+ "]]"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "5945f09b-9516-4d65-ad75-d27a5a1890cf",
+ "metadata": {},
+ "source": [
+ "#### Example clinical annotation\n",
+ "\n",
+ "[Top of page](#Table-of-contents)\n",
+ "\n",
+ "Looking at [981755803](https://www.pharmgkb.org/clinicalAnnotation/981755803), which has all three types of variant annotation evidence as well as label/guideline evidence."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 124,
+ "id": "f5bb8c9e-baeb-4ef6-9373-7c38a333601c",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "# Evidence rows of the example clinical annotation (the ID is compared as a string).\n",
+ "df_981755803 = main_df.loc[main_df[ID_COL_NAME] == '981755803']\n",
+ "\n",
+ "# Inner-join the evidence onto each variant annotation table; clashing variant-table columns get a per-table suffix.\n",
+ "df_981755803_drug, df_981755803_pheno, df_981755803_fa = (\n",
+ "    pd.merge(df_981755803, var_ann, left_on='Evidence ID', right_on='Variant Annotation ID', how='inner', suffixes=(None, suffix))\n",
+ "    for var_ann, suffix in ((var_drug_ann, '_var_drug'), (var_pheno_ann, '_var_pheno'), (var_fa_ann, '_var_fa'))\n",
+ ")"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 229,
+ "id": "811adf62-6f79-4451-9a3e-2772057e4a01",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Number of evidence 30\n",
+ "Number of var/drug evidence 24\n",
+ "Number of var/fa evidence 2\n",
+ "Number of var/pheno evidence 2\n"
+ ]
+ }
+ ],
+ "source": [
+ "# Report one line per evidence frame: the total first, then each variant annotation type.\n",
+ "print(*(\n",
+ "    f'{label} {len(evidence_df)}'\n",
+ "    for label, evidence_df in (\n",
+ "        ('Number of evidence', df_981755803),\n",
+ "        ('Number of var/drug evidence', df_981755803_drug),\n",
+ "        ('Number of var/fa evidence', df_981755803_fa),\n",
+ "        ('Number of var/pheno evidence', df_981755803_pheno),\n",
+ "    )\n",
+ "), sep='\\n')"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 248,
+ "id": "c4a15bc6-90fc-4d4b-bd0e-621b8ffd6093",
+ "metadata": {
+ "scrolled": true
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " Clinical Annotation ID | \n",
+ " Variant/Haplotypes | \n",
+ " Gene | \n",
+ " Level of Evidence | \n",
+ " Phenotype Category | \n",
+ " Drug(s) | \n",
+ " Phenotype(s) | \n",
+ " Evidence ID | \n",
+ " Evidence Type | \n",
+ " PMID | \n",
+ " Summary | \n",
+ " Variant Annotation ID | \n",
+ " Variant/Haplotypes_var_drug | \n",
+ " Gene_var_drug | \n",
+ " Drug(s)_var_drug | \n",
+ " PMID_var_drug | \n",
+ " Phenotype Category_var_drug | \n",
+ " Significance | \n",
+ " Notes | \n",
+ " Sentence | \n",
+ " Alleles | \n",
+ " Specialty Population | \n",
+ " Metabolizer types | \n",
+ " isPlural | \n",
+ " Is/Is Not associated | \n",
+ " Direction of effect | \n",
+ " PD/PK terms | \n",
+ " Multiple drugs And/or | \n",
+ " Population types | \n",
+ " Population Phenotypes or diseases | \n",
+ " Multiple phenotypes or diseases And/or | \n",
+ " Comparison Allele(s) or Genotype(s) | \n",
+ " Comparison Metabolizer types | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " 981755803 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " 1A | \n",
+ " Efficacy | \n",
+ " ivacaftor | \n",
+ " Cystic Fibrosis | \n",
+ " 981755665 | \n",
+ " Variant Drug Annotation | \n",
+ " 21083385 | \n",
+ " Genotypes AA + AG are associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " 981755665 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " ivacaftor | \n",
+ " 21083385 | \n",
+ " Efficacy | \n",
+ " not stated | \n",
+ " Clinical trials were carried out to test efficacy of ivacaftor selecting only patients with the CFTR G551D mutation on at least one allele (genotype AA or AG). | \n",
+ " Genotypes AA + AG are associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " AA + AG | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Are | \n",
+ " Associated with | \n",
+ " NaN | \n",
+ " response to | \n",
+ " NaN | \n",
+ " in people with | \n",
+ " Disease:Cystic Fibrosis | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " 981755803 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " 1A | \n",
+ " Efficacy | \n",
+ " ivacaftor | \n",
+ " Cystic Fibrosis | \n",
+ " 981755678 | \n",
+ " Variant Drug Annotation | \n",
+ " 22047557 | \n",
+ " Genotypes AA + AG are associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " 981755678 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " ivacaftor | \n",
+ " 22047557 | \n",
+ " Efficacy | \n",
+ " not stated | \n",
+ " A clinical trial that selected patients with the G551D CFTR mutation (rs75527207 genotype AA or AG). Patients without this mutation were excluded. One patient included in the placebo group was homozygous for F508del (rs113993960 genotype del/del). | \n",
+ " Genotypes AA + AG are associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " AA + AG | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Are | \n",
+ " Associated with | \n",
+ " NaN | \n",
+ " response to | \n",
+ " NaN | \n",
+ " in people with | \n",
+ " Disease:Cystic Fibrosis | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " 981755803 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " 1A | \n",
+ " Efficacy | \n",
+ " ivacaftor | \n",
+ " Cystic Fibrosis | \n",
+ " 982009991 | \n",
+ " Variant Drug Annotation | \n",
+ " 23590265 | \n",
+ " Allele A is associated with response to ivacaftor in children with Cystic Fibrosis. | \n",
+ " 982009991 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " ivacaftor | \n",
+ " 23590265 | \n",
+ " Efficacy | \n",
+ " yes | \n",
+ " Patients aged 6-11 at time of screening who had at least one allele with the G551D mutation (allele A at position rs75527207) were recruited for this trial. Ivacaftor is only indicated in CF patients with this mutation. Significant improvements in lung function were seen in the ivacaftor treatment group compared to placebo. | \n",
+ " Allele A is associated with response to ivacaftor in children with Cystic Fibrosis. | \n",
+ " A | \n",
+ " Pediatric | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " NaN | \n",
+ " response to | \n",
+ " NaN | \n",
+ " in children with | \n",
+ " Disease:Cystic Fibrosis | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " 981755803 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " 1A | \n",
+ " Efficacy | \n",
+ " ivacaftor | \n",
+ " Cystic Fibrosis | \n",
+ " 1183629335 | \n",
+ " Variant Drug Annotation | \n",
+ " 24066763 | \n",
+ " Genotype AA is associated with response to ivacaftor in women with Cystic Fibrosis. | \n",
+ " 1183629335 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " ivacaftor | \n",
+ " 24066763 | \n",
+ " Efficacy | \n",
+ " not stated | \n",
+ " Case report of a female homozygous for the G551D CFTR mutation (genotype AA) in which ivacaftor was efficacious: increased absolute change in percent of predicted FEV1, increased weight and walk distance and decreased sweat chloride levels over a 12 month course with no sign of plateau to date. | \n",
+ " Genotype AA is associated with response to ivacaftor in women with Cystic Fibrosis. | \n",
+ " AA | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " NaN | \n",
+ " response to | \n",
+ " NaN | \n",
+ " in women with | \n",
+ " Disease:Cystic Fibrosis | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " 981755803 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " 1A | \n",
+ " Efficacy | \n",
+ " ivacaftor | \n",
+ " Cystic Fibrosis | \n",
+ " 1448423752 | \n",
+ " Variant Drug Annotation | \n",
+ " 27773592 | \n",
+ " Genotypes AA + AG is associated with increased response to ivacaftor in people with Cystic Fibrosis as compared to genotype GG. | \n",
+ " 1448423752 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " ivacaftor | \n",
+ " 27773592 | \n",
+ " Efficacy | \n",
+ " yes | \n",
+ " The outcome of change in sweat chloride was correlated with change in FEV1 in patients with cystic fibrosis and found to have improved results for both. | \n",
+ " Genotypes AA + AG is associated with increased response to ivacaftor in people with Cystic Fibrosis as compared to genotype GG. | \n",
+ " AA + AG | \n",
+ " Pediatric | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " increased | \n",
+ " response to | \n",
+ " NaN | \n",
+ " in people with | \n",
+ " Disease:Cystic Fibrosis | \n",
+ " NaN | \n",
+ " GG | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 5 | \n",
+ " 981755803 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " 1A | \n",
+ " Efficacy | \n",
+ " ivacaftor | \n",
+ " Cystic Fibrosis | \n",
+ " 1449191908 | \n",
+ " Variant Drug Annotation | \n",
+ " 25682022 | \n",
+ " Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " 1449191908 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " ivacaftor | \n",
+ " 25682022 | \n",
+ " Efficacy | \n",
+ " not stated | \n",
+ " Study was an expanded access program targeted at patients with severe lung disease and was not powered to determine efficacy. Majority of patients reported an improvement in FEV following 24 weeks of treatment. | \n",
+ " Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " A | \n",
+ " Pediatric | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " NaN | \n",
+ " response to | \n",
+ " NaN | \n",
+ " in people with | \n",
+ " Disease:Cystic Fibrosis | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 6 | \n",
+ " 981755803 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " 1A | \n",
+ " Efficacy | \n",
+ " ivacaftor | \n",
+ " Cystic Fibrosis | \n",
+ " 1449192055 | \n",
+ " Variant Drug Annotation | \n",
+ " 28711222 | \n",
+ " Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " 1449192055 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " ivacaftor | \n",
+ " 28711222 | \n",
+ " Efficacy | \n",
+ " yes | \n",
+ " G551D allele. Statistically significant increases in FEV1, weight and BMI and statistically significant decreases in sweat chloride level, the number of days of antibiotic treatment and in the use of some maintenance treatments.; No differences in bone density, pancreatic insufficiency and cystic fibrosis related diabetes were observed. | \n",
+ " Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " A | \n",
+ " Pediatric | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " NaN | \n",
+ " response to | \n",
+ " NaN | \n",
+ " in people with | \n",
+ " Disease:Cystic Fibrosis | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 7 | \n",
+ " 981755803 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " 1A | \n",
+ " Efficacy | \n",
+ " ivacaftor | \n",
+ " Cystic Fibrosis | \n",
+ " 1449192093 | \n",
+ " Variant Drug Annotation | \n",
+ " 25311995 | \n",
+ " Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " 1449192093 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " ivacaftor | \n",
+ " 25311995 | \n",
+ " Efficacy | \n",
+ " not stated | \n",
+ " G551 D allele. Increases in FEV1, body weight, CFQ-R scores and time to first pulmonary exacerbation were observed. | \n",
+ " Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " A | \n",
+ " Pediatric | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " NaN | \n",
+ " response to | \n",
+ " NaN | \n",
+ " in people with | \n",
+ " Disease:Cystic Fibrosis | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 8 | \n",
+ " 981755803 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " 1A | \n",
+ " Efficacy | \n",
+ " ivacaftor | \n",
+ " Cystic Fibrosis | \n",
+ " 1449192439 | \n",
+ " Variant Drug Annotation | \n",
+ " 28611235 | \n",
+ " Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " 1449192439 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " ivacaftor | \n",
+ " 28611235 | \n",
+ " Efficacy | \n",
+ " yes | \n",
+ " G551D allele. FEV1, Alfred wellness score, exercise time, CFQ-R score and sweat chloride levels showed a significant improvement following ivacaftor treatment as compared to placebo while other outcomes (VO2, ventilation, cardiac response nd recovery following exercise) did not. | \n",
+ " Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " A | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " NaN | \n",
+ " response to | \n",
+ " NaN | \n",
+ " in people with | \n",
+ " Disease:Cystic Fibrosis | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 9 | \n",
+ " 981755803 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " 1A | \n",
+ " Efficacy | \n",
+ " ivacaftor | \n",
+ " Cystic Fibrosis | \n",
+ " 1449192481 | \n",
+ " Variant Drug Annotation | \n",
+ " 26135562 | \n",
+ " Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " 1449192481 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " ivacaftor | \n",
+ " 26135562 | \n",
+ " Efficacy | \n",
+ " yes | \n",
+ " G551D allele. Analysis of CFQ-R scores from participants in the STRIVE trial. Scores for eating problems, health perceptions, physical functioning, respiratory symptoms, social functioning, treatment burden and vitality showed significant improvements following ivacaftor treatment. | \n",
+ " Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " A | \n",
+ " Pediatric | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " NaN | \n",
+ " response to | \n",
+ " NaN | \n",
+ " in people with | \n",
+ " Disease:Cystic Fibrosis | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 10 | \n",
+ " 981755803 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " 1A | \n",
+ " Efficacy | \n",
+ " ivacaftor | \n",
+ " Cystic Fibrosis | \n",
+ " 1449192494 | \n",
+ " Variant Drug Annotation | \n",
+ " 25171465 | \n",
+ " Allele A is associated with response to ivacaftor in children with Cystic Fibrosis. | \n",
+ " 1449192494 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " ivacaftor | \n",
+ " 25171465 | \n",
+ " Efficacy | \n",
+ " not stated | \n",
+ " Case study of a pediatric cystic fibrosis patient. Improvements in sweat chloride, BMI, bronchiectasis and lung function reported following ivacaftor treatment. | \n",
+ " Allele A is associated with response to ivacaftor in children with Cystic Fibrosis. | \n",
+ " A | \n",
+ " Pediatric | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " NaN | \n",
+ " response to | \n",
+ " NaN | \n",
+ " in children with | \n",
+ " Disease:Cystic Fibrosis | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 11 | \n",
+ " 981755803 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " 1A | \n",
+ " Efficacy | \n",
+ " ivacaftor | \n",
+ " Cystic Fibrosis | \n",
+ " 1449192576 | \n",
+ " Variant Drug Annotation | \n",
+ " 25755212 | \n",
+ " Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " 1449192576 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " ivacaftor | \n",
+ " 25755212 | \n",
+ " Efficacy | \n",
+ " yes | \n",
+ " Post hoc analysis of clinical outcomes of the STRIVE and ENVISION trials. Participants were split into tertiles based on FEV1 score and outcomes in change in baseline FEV1, body weight, CFQ-R score and sweat chloride levels as well as number of days of pulmonary exacerbation were assessed. All outcomes were significantly improved in the upper tertile, all outcomes apart from number of days of pulmonary exacerbation were significantly improved in the middle tertile and absolute change in FEV1, body weight and sweat chloride levels were significantly improved in the lower tertile. | \n",
+ " Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " A | \n",
+ " Pediatric | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " NaN | \n",
+ " response to | \n",
+ " NaN | \n",
+ " in people with | \n",
+ " Disease:Cystic Fibrosis | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 12 | \n",
+ " 981755803 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " 1A | \n",
+ " Efficacy | \n",
+ " ivacaftor | \n",
+ " Cystic Fibrosis | \n",
+ " 1449192615 | \n",
+ " Variant Drug Annotation | \n",
+ " 26568242 | \n",
+ " Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " 1449192615 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " ivacaftor | \n",
+ " 26568242 | \n",
+ " Efficacy | \n",
+ " yes | \n",
+ " Response measured by changes in sweat chloride levels, FEV1 and BMI. | \n",
+ " Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " A | \n",
+ " Pediatric | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " NaN | \n",
+ " response to | \n",
+ " NaN | \n",
+ " in people with | \n",
+ " Disease:Cystic Fibrosis | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 13 | \n",
+ " 981755803 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " 1A | \n",
+ " Efficacy | \n",
+ " ivacaftor | \n",
+ " Cystic Fibrosis | \n",
+ " 1449192709 | \n",
+ " Variant Drug Annotation | \n",
+ " 25473543 | \n",
+ " Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " 1449192709 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " ivacaftor | \n",
+ " 25473543 | \n",
+ " Efficacy | \n",
+ " not stated | \n",
+ " G551D allele. Case report of three patients with the F508del/G551D genotype. Reported improvements in FEV1, body weight, sweat chloride levels and scores in the respiratory domain of the CFQ-R. | \n",
+ " Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " A | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " NaN | \n",
+ " response to | \n",
+ " NaN | \n",
+ " in people with | \n",
+ " Disease:Cystic Fibrosis | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 14 | \n",
+ " 981755803 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " 1A | \n",
+ " Efficacy | \n",
+ " ivacaftor | \n",
+ " Cystic Fibrosis | \n",
+ " 1449192721 | \n",
+ " Variant Drug Annotation | \n",
+ " 25145599 | \n",
+ " Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " 1449192721 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " ivacaftor | \n",
+ " 25145599 | \n",
+ " Efficacy | \n",
+ " yes | \n",
+ " G551D allele. Significant increases in %FVC and %FEV1 compared to baseline were seen at 6 months of ivacaftor treatment, but both measures declined to baseline by 12 months of ivacaftor treatment. Significant improvements in BMI, body weight, sinus disease status and sweat chloride levels were seen at 12 months of ivacaftor treatment. | \n",
+ " Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " A | \n",
+ " Pediatric | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " NaN | \n",
+ " response to | \n",
+ " NaN | \n",
+ " in people with | \n",
+ " Disease:Cystic Fibrosis | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 15 | \n",
+ " 981755803 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " 1A | \n",
+ " Efficacy | \n",
+ " ivacaftor | \n",
+ " Cystic Fibrosis | \n",
+ " 1450043422 | \n",
+ " Variant Drug Annotation | \n",
+ " 23628510 | \n",
+ " Allele A is associated with response to ivacaftor in children with Cystic Fibrosis. | \n",
+ " 1450043422 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " ivacaftor | \n",
+ " 23628510 | \n",
+ " Efficacy | \n",
+ " yes | \n",
+ " NaN | \n",
+ " Allele A is associated with response to ivacaftor in children with Cystic Fibrosis. | \n",
+ " A | \n",
+ " Pediatric | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " NaN | \n",
+ " response to | \n",
+ " NaN | \n",
+ " in children with | \n",
+ " Disease:Cystic Fibrosis | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
" \n",
- " 0 | \n",
+ " 16 | \n",
" 981755803 | \n",
" rs75527207 | \n",
" CFTR | \n",
@@ -410,21 +1775,237 @@
" Efficacy | \n",
" ivacaftor | \n",
" Cystic Fibrosis | \n",
- " 981755665 | \n",
+ " 1184512440 | \n",
" Variant Drug Annotation | \n",
- " 21083385 | \n",
- " Genotypes AA + AG are associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
- " 981755665 | \n",
+ " 25049054 | \n",
+ " Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " 1184512440 | \n",
" rs75527207 | \n",
" CFTR | \n",
" ivacaftor | \n",
- " 21083385 | \n",
+ " 25049054 | \n",
+ " Efficacy | \n",
+ " yes | \n",
+ " Patients with at least one G551D-CFTR allele were recruited and treated with ivacaftor for one year. Mean weight and BMI improved at 6 months from baseline, but only mean weight was increased again at 12 months. Mean percentage FVC, FEV1 and FEF25-75% returned to baseline levels by 12 months of treatment. | \n",
+ " Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " A | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " NaN | \n",
+ " response to | \n",
+ " NaN | \n",
+ " in people with | \n",
+ " Disease:Cystic Fibrosis | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 17 | \n",
+ " 981755803 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " 1A | \n",
+ " Efficacy | \n",
+ " ivacaftor | \n",
+ " Cystic Fibrosis | \n",
+ " 981755746 | \n",
+ " Variant Drug Annotation | \n",
+ " 22942289 | \n",
+ " Allele A is associated with increased response to ivacaftor. | \n",
+ " 981755746 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " ivacaftor | \n",
+ " 22942289 | \n",
" Efficacy | \n",
" not stated | \n",
- " Clinical trials were carried out to test efficacy of ivacaftor selecting only patients with the CFTR G551D mutation on at least one allele (genotype AA or AG). | \n",
+ " In vitro studies using proteoliposomes containing CFTR, or CFTR with the G551D mutation (rs75527207 allele A), or CFTR with the F508del mutation (rs113993960 allele del). Ivacaftor in the presence of ATP potentiated channel activity of CFTR-G551D. | \n",
+ " Allele A is associated with increased response to ivacaftor. | \n",
+ " A | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " increased | \n",
+ " response to | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 18 | \n",
+ " 981755803 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " 1A | \n",
+ " Efficacy | \n",
+ " ivacaftor | \n",
+ " Cystic Fibrosis | \n",
+ " 981755699 | \n",
+ " Variant Drug Annotation | \n",
+ " 19846789 | \n",
+ " Allele A is associated with increased response to ivacaftor. | \n",
+ " 981755699 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " ivacaftor | \n",
+ " 19846789 | \n",
+ " Efficacy | \n",
+ " yes | \n",
+ " In vitro assays that show ivacaftor potentiates CFTR with the G551D mutation (rs75527207 allele A) - see details described in study parameters. | \n",
+ " Allele A is associated with increased response to ivacaftor. | \n",
+ " A | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " increased | \n",
+ " response to | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 19 | \n",
+ " 981755803 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " 1A | \n",
+ " Efficacy | \n",
+ " ivacaftor | \n",
+ " Cystic Fibrosis | \n",
+ " 981755787 | \n",
+ " Variant Drug Annotation | \n",
+ " 22293084 | \n",
+ " Allele A is associated with increased response to ivacaftor. | \n",
+ " 981755787 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " ivacaftor | \n",
+ " 22293084 | \n",
+ " Efficacy | \n",
+ " yes | \n",
+ " as compared to baseline. In vitro assays using transfected Fisher Rat Thyroid cells expressing CFTR. Before treatment, cells were activated by exposure to PKA and ATP before ivacaftor treatment. In vitro assays using transfected Fisher Rat Thyroid cells expressing CFTR. Cells expressing G551D-CFTR (rs75527207 allele A) responded to ivacaftor treatment with a significantly enhanced channel open probability and increased chloride transport. Single channel current amplitude at 80mV was not significantly enhanced. | \n",
+ " Allele A is associated with increased response to ivacaftor. | \n",
+ " A | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " increased | \n",
+ " response to | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 20 | \n",
+ " 981755803 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " 1A | \n",
+ " Efficacy | \n",
+ " ivacaftor | \n",
+ " Cystic Fibrosis | \n",
+ " 1043737597 | \n",
+ " Variant Drug Annotation | \n",
+ " 23757359 | \n",
+ " Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " 1043737597 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " ivacaftor | \n",
+ " 23757359 | \n",
+ " Efficacy | \n",
+ " yes | \n",
+ " A retrospective study of patients in Germany with severe Cystic Fibrosis (FEV1 <40%predicted) with the G551D mutation who were treated with ivacaftor. On average, FEV1and body weight increased significantly, though response was variable in this patient group and several patients discontinued ivacaftor for different complications. | \n",
+ " Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " A | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " NaN | \n",
+ " response to | \n",
+ " NaN | \n",
+ " in people with | \n",
+ " Disease:Cystic Fibrosis | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 21 | \n",
+ " 981755803 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " 1A | \n",
+ " Efficacy | \n",
+ " ivacaftor | \n",
+ " Cystic Fibrosis | \n",
+ " 982006840 | \n",
+ " Variant Drug Annotation | \n",
+ " 23313410 | \n",
+ " Allele A is associated with response to ivacaftor in men with Cystic Fibrosis. | \n",
+ " 982006840 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " ivacaftor | \n",
+ " 23313410 | \n",
+ " Efficacy | \n",
+ " not stated | \n",
+ " A case report of lung function improvements 6 months after treatment with ivacaftor in a male patient with severe lung disease - he had the CFTR G511D (rsrs75527207 allele A)/deltaF508 genotype (rs113993960 del CTT) and so could be given ivacaftor. | \n",
+ " Allele A is associated with response to ivacaftor in men with Cystic Fibrosis. | \n",
+ " A | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Is | \n",
+ " Associated with | \n",
+ " NaN | \n",
+ " response to | \n",
+ " NaN | \n",
+ " in men with | \n",
+ " Disease:Cystic Fibrosis | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 22 | \n",
+ " 981755803 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " 1A | \n",
+ " Efficacy | \n",
+ " ivacaftor | \n",
+ " Cystic Fibrosis | \n",
+ " 1446903789 | \n",
+ " Variant Drug Annotation | \n",
+ " 24461666 | \n",
+ " Genotypes AA + AG are associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
+ " 1446903789 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " ivacaftor | \n",
+ " 24461666 | \n",
+ " Efficacy | \n",
+ " yes | \n",
+ " The authors wanted to assess the efficacy of ivacaftor in patients with cystic fibrosis who have normal spirometry. The authors assessed lung function improvement in patients using lung clearance index (LCI) as well as forced expiratory volume in 1 second (FEV1), and only included patients with < 90% FEV1 values. The primary outcome was change in LCI from baseline. This was a phase 2, multi-centre, placebo-controlled, 2x2 crossover study. One group, sequence 1, took placebo first, followed by 28 day washout, then took ivacaftor 150 mg 2x daily for 4 weeks. The second group had the sequence of treatment reversed. | \n",
" Genotypes AA + AG are associated with response to ivacaftor in people with Cystic Fibrosis. | \n",
" AA + AG | \n",
- " NaN | \n",
+ " Pediatric | \n",
" NaN | \n",
" Are | \n",
" Associated with | \n",
@@ -437,58 +2018,393 @@
" NaN | \n",
" NaN | \n",
"
\n",
+ " \n",
+ " 23 | \n",
+ " 981755803 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " 1A | \n",
+ " Efficacy | \n",
+ " ivacaftor | \n",
+ " Cystic Fibrosis | \n",
+ " 1448099051 | \n",
+ " Variant Drug Annotation | \n",
+ " 27158673 | \n",
+ " Genotypes AA + AG are associated with increased response to ivacaftor in people with Cystic Fibrosis as compared to genotype GG. | \n",
+ " 1448099051 | \n",
+ " rs75527207 | \n",
+ " CFTR | \n",
+ " ivacaftor | \n",
+ " 27158673 | \n",
+ " Efficacy | \n",
+ " yes | \n",
+ " Measured in adult patients, with changes in lung volume, sweat chloride, distensibility, wall thickness, expiratory lumen area, and inspiratory lumen area measured before starting ivacaftor and 48 hour after starting ivacaftor. | \n",
+ " Genotypes AA + AG are associated with increased response to ivacaftor in people with Cystic Fibrosis as compared to genotype GG. | \n",
+ " AA + AG | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " Are | \n",
+ " Associated with | \n",
+ " increased | \n",
+ " response to | \n",
+ " NaN | \n",
+ " in people with | \n",
+ " Disease:Cystic Fibrosis | \n",
+ " NaN | \n",
+ " GG | \n",
+ " NaN | \n",
+ "
\n",
" \n",
"
\n",
"
"
],
"text/plain": [
- " Clinical Annotation ID Variant/Haplotypes Gene Level of Evidence \\\n",
- "0 981755803 rs75527207 CFTR 1A \n",
+ " Clinical Annotation ID Variant/Haplotypes Gene Level of Evidence \\\n",
+ "0 981755803 rs75527207 CFTR 1A \n",
+ "1 981755803 rs75527207 CFTR 1A \n",
+ "2 981755803 rs75527207 CFTR 1A \n",
+ "3 981755803 rs75527207 CFTR 1A \n",
+ "4 981755803 rs75527207 CFTR 1A \n",
+ "5 981755803 rs75527207 CFTR 1A \n",
+ "6 981755803 rs75527207 CFTR 1A \n",
+ "7 981755803 rs75527207 CFTR 1A \n",
+ "8 981755803 rs75527207 CFTR 1A \n",
+ "9 981755803 rs75527207 CFTR 1A \n",
+ "10 981755803 rs75527207 CFTR 1A \n",
+ "11 981755803 rs75527207 CFTR 1A \n",
+ "12 981755803 rs75527207 CFTR 1A \n",
+ "13 981755803 rs75527207 CFTR 1A \n",
+ "14 981755803 rs75527207 CFTR 1A \n",
+ "15 981755803 rs75527207 CFTR 1A \n",
+ "16 981755803 rs75527207 CFTR 1A \n",
+ "17 981755803 rs75527207 CFTR 1A \n",
+ "18 981755803 rs75527207 CFTR 1A \n",
+ "19 981755803 rs75527207 CFTR 1A \n",
+ "20 981755803 rs75527207 CFTR 1A \n",
+ "21 981755803 rs75527207 CFTR 1A \n",
+ "22 981755803 rs75527207 CFTR 1A \n",
+ "23 981755803 rs75527207 CFTR 1A \n",
"\n",
- " Phenotype Category Drug(s) Phenotype(s) Evidence ID \\\n",
- "0 Efficacy ivacaftor Cystic Fibrosis 981755665 \n",
+ " Phenotype Category Drug(s) Phenotype(s) Evidence ID \\\n",
+ "0 Efficacy ivacaftor Cystic Fibrosis 981755665 \n",
+ "1 Efficacy ivacaftor Cystic Fibrosis 981755678 \n",
+ "2 Efficacy ivacaftor Cystic Fibrosis 982009991 \n",
+ "3 Efficacy ivacaftor Cystic Fibrosis 1183629335 \n",
+ "4 Efficacy ivacaftor Cystic Fibrosis 1448423752 \n",
+ "5 Efficacy ivacaftor Cystic Fibrosis 1449191908 \n",
+ "6 Efficacy ivacaftor Cystic Fibrosis 1449192055 \n",
+ "7 Efficacy ivacaftor Cystic Fibrosis 1449192093 \n",
+ "8 Efficacy ivacaftor Cystic Fibrosis 1449192439 \n",
+ "9 Efficacy ivacaftor Cystic Fibrosis 1449192481 \n",
+ "10 Efficacy ivacaftor Cystic Fibrosis 1449192494 \n",
+ "11 Efficacy ivacaftor Cystic Fibrosis 1449192576 \n",
+ "12 Efficacy ivacaftor Cystic Fibrosis 1449192615 \n",
+ "13 Efficacy ivacaftor Cystic Fibrosis 1449192709 \n",
+ "14 Efficacy ivacaftor Cystic Fibrosis 1449192721 \n",
+ "15 Efficacy ivacaftor Cystic Fibrosis 1450043422 \n",
+ "16 Efficacy ivacaftor Cystic Fibrosis 1184512440 \n",
+ "17 Efficacy ivacaftor Cystic Fibrosis 981755746 \n",
+ "18 Efficacy ivacaftor Cystic Fibrosis 981755699 \n",
+ "19 Efficacy ivacaftor Cystic Fibrosis 981755787 \n",
+ "20 Efficacy ivacaftor Cystic Fibrosis 1043737597 \n",
+ "21 Efficacy ivacaftor Cystic Fibrosis 982006840 \n",
+ "22 Efficacy ivacaftor Cystic Fibrosis 1446903789 \n",
+ "23 Efficacy ivacaftor Cystic Fibrosis 1448099051 \n",
"\n",
- " Evidence Type PMID \\\n",
- "0 Variant Drug Annotation 21083385 \n",
+ " Evidence Type PMID \\\n",
+ "0 Variant Drug Annotation 21083385 \n",
+ "1 Variant Drug Annotation 22047557 \n",
+ "2 Variant Drug Annotation 23590265 \n",
+ "3 Variant Drug Annotation 24066763 \n",
+ "4 Variant Drug Annotation 27773592 \n",
+ "5 Variant Drug Annotation 25682022 \n",
+ "6 Variant Drug Annotation 28711222 \n",
+ "7 Variant Drug Annotation 25311995 \n",
+ "8 Variant Drug Annotation 28611235 \n",
+ "9 Variant Drug Annotation 26135562 \n",
+ "10 Variant Drug Annotation 25171465 \n",
+ "11 Variant Drug Annotation 25755212 \n",
+ "12 Variant Drug Annotation 26568242 \n",
+ "13 Variant Drug Annotation 25473543 \n",
+ "14 Variant Drug Annotation 25145599 \n",
+ "15 Variant Drug Annotation 23628510 \n",
+ "16 Variant Drug Annotation 25049054 \n",
+ "17 Variant Drug Annotation 22942289 \n",
+ "18 Variant Drug Annotation 19846789 \n",
+ "19 Variant Drug Annotation 22293084 \n",
+ "20 Variant Drug Annotation 23757359 \n",
+ "21 Variant Drug Annotation 23313410 \n",
+ "22 Variant Drug Annotation 24461666 \n",
+ "23 Variant Drug Annotation 27158673 \n",
"\n",
- " Summary \\\n",
- "0 Genotypes AA + AG are associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ " Summary \\\n",
+ "0 Genotypes AA + AG are associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "1 Genotypes AA + AG are associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "2 Allele A is associated with response to ivacaftor in children with Cystic Fibrosis. \n",
+ "3 Genotype AA is associated with response to ivacaftor in women with Cystic Fibrosis. \n",
+ "4 Genotypes AA + AG is associated with increased response to ivacaftor in people with Cystic Fibrosis as compared to genotype GG. \n",
+ "5 Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "6 Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "7 Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "8 Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "9 Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "10 Allele A is associated with response to ivacaftor in children with Cystic Fibrosis. \n",
+ "11 Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "12 Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "13 Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "14 Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "15 Allele A is associated with response to ivacaftor in children with Cystic Fibrosis. \n",
+ "16 Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "17 Allele A is associated with increased response to ivacaftor. \n",
+ "18 Allele A is associated with increased response to ivacaftor. \n",
+ "19 Allele A is associated with increased response to ivacaftor. \n",
+ "20 Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "21 Allele A is associated with response to ivacaftor in men with Cystic Fibrosis. \n",
+ "22 Genotypes AA + AG are associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "23 Genotypes AA + AG are associated with increased response to ivacaftor in people with Cystic Fibrosis as compared to genotype GG. \n",
"\n",
- " Variant Annotation ID Variant/Haplotypes_var_drug Gene_var_drug \\\n",
- "0 981755665 rs75527207 CFTR \n",
+ " Variant Annotation ID Variant/Haplotypes_var_drug Gene_var_drug \\\n",
+ "0 981755665 rs75527207 CFTR \n",
+ "1 981755678 rs75527207 CFTR \n",
+ "2 982009991 rs75527207 CFTR \n",
+ "3 1183629335 rs75527207 CFTR \n",
+ "4 1448423752 rs75527207 CFTR \n",
+ "5 1449191908 rs75527207 CFTR \n",
+ "6 1449192055 rs75527207 CFTR \n",
+ "7 1449192093 rs75527207 CFTR \n",
+ "8 1449192439 rs75527207 CFTR \n",
+ "9 1449192481 rs75527207 CFTR \n",
+ "10 1449192494 rs75527207 CFTR \n",
+ "11 1449192576 rs75527207 CFTR \n",
+ "12 1449192615 rs75527207 CFTR \n",
+ "13 1449192709 rs75527207 CFTR \n",
+ "14 1449192721 rs75527207 CFTR \n",
+ "15 1450043422 rs75527207 CFTR \n",
+ "16 1184512440 rs75527207 CFTR \n",
+ "17 981755746 rs75527207 CFTR \n",
+ "18 981755699 rs75527207 CFTR \n",
+ "19 981755787 rs75527207 CFTR \n",
+ "20 1043737597 rs75527207 CFTR \n",
+ "21 982006840 rs75527207 CFTR \n",
+ "22 1446903789 rs75527207 CFTR \n",
+ "23 1448099051 rs75527207 CFTR \n",
"\n",
- " Drug(s)_var_drug PMID_var_drug Phenotype Category_var_drug Significance \\\n",
- "0 ivacaftor 21083385 Efficacy not stated \n",
+ " Drug(s)_var_drug PMID_var_drug Phenotype Category_var_drug Significance \\\n",
+ "0 ivacaftor 21083385 Efficacy not stated \n",
+ "1 ivacaftor 22047557 Efficacy not stated \n",
+ "2 ivacaftor 23590265 Efficacy yes \n",
+ "3 ivacaftor 24066763 Efficacy not stated \n",
+ "4 ivacaftor 27773592 Efficacy yes \n",
+ "5 ivacaftor 25682022 Efficacy not stated \n",
+ "6 ivacaftor 28711222 Efficacy yes \n",
+ "7 ivacaftor 25311995 Efficacy not stated \n",
+ "8 ivacaftor 28611235 Efficacy yes \n",
+ "9 ivacaftor 26135562 Efficacy yes \n",
+ "10 ivacaftor 25171465 Efficacy not stated \n",
+ "11 ivacaftor 25755212 Efficacy yes \n",
+ "12 ivacaftor 26568242 Efficacy yes \n",
+ "13 ivacaftor 25473543 Efficacy not stated \n",
+ "14 ivacaftor 25145599 Efficacy yes \n",
+ "15 ivacaftor 23628510 Efficacy yes \n",
+ "16 ivacaftor 25049054 Efficacy yes \n",
+ "17 ivacaftor 22942289 Efficacy not stated \n",
+ "18 ivacaftor 19846789 Efficacy yes \n",
+ "19 ivacaftor 22293084 Efficacy yes \n",
+ "20 ivacaftor 23757359 Efficacy yes \n",
+ "21 ivacaftor 23313410 Efficacy not stated \n",
+ "22 ivacaftor 24461666 Efficacy yes \n",
+ "23 ivacaftor 27158673 Efficacy yes \n",
"\n",
- " Notes \\\n",
- "0 Clinical trials were carried out to test efficacy of ivacaftor selecting only patients with the CFTR G551D mutation on at least one allele (genotype AA or AG). \n",
+ " Notes \\\n",
+ "0 Clinical trials were carried out to test efficacy of ivacaftor selecting only patients with the CFTR G551D mutation on at least one allele (genotype AA or AG). \n",
+ "1 A clinical trial that selected patients with the G551D CFTR mutation (rs75527207 genotype AA or AG). Patients without this mutation were excluded. One patient included in the placebo group was homozygous for F508del (rs113993960 genotype del/del). \n",
+ "2 Patients aged 6-11 at time of screening who had at least one allele with the G551D mutation (allele A at position rs75527207) were recruited for this trial. Ivacaftor is only indicated in CF patients with this mutation. Significant improvements in lung function were seen in the ivacaftor treatment group compared to placebo. \n",
+ "3 Case report of a female homozygous for the G551D CFTR mutation (genotype AA) in which ivacaftor was efficacious: increased absolute change in percent of predicted FEV1, increased weight and walk distance and decreased sweat chloride levels over a 12 month course with no sign of plateau to date. \n",
+ "4 The outcome of change in sweat chloride was correlated with change in FEV1 in patients with cystic fibrosis and found to have improved results for both. \n",
+ "5 Study was an expanded access program targeted at patients with severe lung disease and was not powered to determine efficacy. Majority of patients reported an improvement in FEV following 24 weeks of treatment. \n",
+ "6 G551D allele. Statistically significant increases in FEV1, weight and BMI and statistically significant decreases in sweat chloride level, the number of days of antibiotic treatment and in the use of some maintenance treatments.; No differences in bone density, pancreatic insufficiency and cystic fibrosis related diabetes were observed. \n",
+ "7 G551 D allele. Increases in FEV1, body weight, CFQ-R scores and time to first pulmonary exacerbation were observed. \n",
+ "8 G551D allele. FEV1, Alfred wellness score, exercise time, CFQ-R score and sweat chloride levels showed a significant improvement following ivacaftor treatment as compared to placebo while other outcomes (VO2, ventilation, cardiac response nd recovery following exercise) did not. \n",
+ "9 G551D allele. Analysis of CFQ-R scores from participants in the STRIVE trial. Scores for eating problems, health perceptions, physical functioning, respiratory symptoms, social functioning, treatment burden and vitality showed significant improvements following ivacaftor treatment. \n",
+ "10 Case study of a pediatric cystic fibrosis patient. Improvements in sweat chloride, BMI, bronchiectasis and lung function reported following ivacaftor treatment. \n",
+ "11 Post hoc analysis of clinical outcomes of the STRIVE and ENVISION trials. Participants were split into tertiles based on FEV1 score and outcomes in change in baseline FEV1, body weight, CFQ-R score and sweat chloride levels as well as number of days of pulmonary exacerbation were assessed. All outcomes were significantly improved in the upper tertile, all outcomes apart from number of days of pulmonary exacerbation were significantly improved in the middle tertile and absolute change in FEV1, body weight and sweat chloride levels were significantly improved in the lower tertile. \n",
+ "12 Response measured by changes in sweat chloride levels, FEV1 and BMI. \n",
+ "13 G551D allele. Case report of three patients with the F508del/G551D genotype. Reported improvements in FEV1, body weight, sweat chloride levels and scores in the respiratory domain of the CFQ-R. \n",
+ "14 G551D allele. Significant increases in %FVC and %FEV1 compared to baseline were seen at 6 months of ivacaftor treatment, but both measures declined to baseline by 12 months of ivacaftor treatment. Significant improvements in BMI, body weight, sinus disease status and sweat chloride levels were seen at 12 months of ivacaftor treatment. \n",
+ "15 NaN \n",
+ "16 Patients with at least one G551D-CFTR allele were recruited and treated with ivacaftor for one year. Mean weight and BMI improved at 6 months from baseline, but only mean weight was increased again at 12 months. Mean percentage FVC, FEV1 and FEF25-75% returned to baseline levels by 12 months of treatment. \n",
+ "17 In vitro studies using proteoliposomes containing CFTR, or CFTR with the G551D mutation (rs75527207 allele A), or CFTR with the F508del mutation (rs113993960 allele del). Ivacaftor in the presence of ATP potentiated channel activity of CFTR-G551D. \n",
+ "18 In vitro assays that show ivacaftor potentiates CFTR with the G551D mutation (rs75527207 allele A) - see details described in study parameters. \n",
+ "19 as compared to baseline. In vitro assays using transfected Fisher Rat Thyroid cells expressing CFTR. Before treatment, cells were activated by exposure to PKA and ATP before ivacaftor treatment. In vitro assays using transfected Fisher Rat Thyroid cells expressing CFTR. Cells expressing G551D-CFTR (rs75527207 allele A) responded to ivacaftor treatment with a significantly enhanced channel open probability and increased chloride transport. Single channel current amplitude at 80mV was not significantly enhanced. \n",
+ "20 A retrospective study of patients in Germany with severe Cystic Fibrosis (FEV1 <40%predicted) with the G551D mutation who were treated with ivacaftor. On average, FEV1and body weight increased significantly, though response was variable in this patient group and several patients discontinued ivacaftor for different complications. \n",
+ "21 A case report of lung function improvements 6 months after treatment with ivacaftor in a male patient with severe lung disease - he had the CFTR G511D (rsrs75527207 allele A)/deltaF508 genotype (rs113993960 del CTT) and so could be given ivacaftor. \n",
+ "22 The authors wanted to assess the efficacy of ivacaftor in patients with cystic fibrosis who have normal spirometry. The authors assessed lung function improvement in patients using lung clearance index (LCI) as well as forced expiratory volume in 1 second (FEV1), and only included patients with < 90% FEV1 values. The primary outcome was change in LCI from baseline. This was a phase 2, multi-centre, placebo-controlled, 2x2 crossover study. One group, sequence 1, took placebo first, followed by 28 day washout, then took ivacaftor 150 mg 2x daily for 4 weeks. The second group had the sequence of treatment reversed. \n",
+ "23 Measured in adult patients, with changes in lung volume, sweat chloride, distensibility, wall thickness, expiratory lumen area, and inspiratory lumen area measured before starting ivacaftor and 48 hour after starting ivacaftor. \n",
"\n",
- " Sentence \\\n",
- "0 Genotypes AA + AG are associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ " Sentence \\\n",
+ "0 Genotypes AA + AG are associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "1 Genotypes AA + AG are associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "2 Allele A is associated with response to ivacaftor in children with Cystic Fibrosis. \n",
+ "3 Genotype AA is associated with response to ivacaftor in women with Cystic Fibrosis. \n",
+ "4 Genotypes AA + AG is associated with increased response to ivacaftor in people with Cystic Fibrosis as compared to genotype GG. \n",
+ "5 Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "6 Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "7 Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "8 Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "9 Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "10 Allele A is associated with response to ivacaftor in children with Cystic Fibrosis. \n",
+ "11 Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "12 Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "13 Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "14 Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "15 Allele A is associated with response to ivacaftor in children with Cystic Fibrosis. \n",
+ "16 Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "17 Allele A is associated with increased response to ivacaftor. \n",
+ "18 Allele A is associated with increased response to ivacaftor. \n",
+ "19 Allele A is associated with increased response to ivacaftor. \n",
+ "20 Allele A is associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "21 Allele A is associated with response to ivacaftor in men with Cystic Fibrosis. \n",
+ "22 Genotypes AA + AG are associated with response to ivacaftor in people with Cystic Fibrosis. \n",
+ "23 Genotypes AA + AG are associated with increased response to ivacaftor in people with Cystic Fibrosis as compared to genotype GG. \n",
"\n",
- " Alleles Specialty Population Metabolizer types isPlural \\\n",
- "0 AA + AG NaN NaN Are \n",
+ " Alleles Specialty Population Metabolizer types isPlural \\\n",
+ "0 AA + AG NaN NaN Are \n",
+ "1 AA + AG NaN NaN Are \n",
+ "2 A Pediatric NaN Is \n",
+ "3 AA NaN NaN Is \n",
+ "4 AA + AG Pediatric NaN Is \n",
+ "5 A Pediatric NaN Is \n",
+ "6 A Pediatric NaN Is \n",
+ "7 A Pediatric NaN Is \n",
+ "8 A NaN NaN Is \n",
+ "9 A Pediatric NaN Is \n",
+ "10 A Pediatric NaN Is \n",
+ "11 A Pediatric NaN Is \n",
+ "12 A Pediatric NaN Is \n",
+ "13 A NaN NaN Is \n",
+ "14 A Pediatric NaN Is \n",
+ "15 A Pediatric NaN Is \n",
+ "16 A NaN NaN Is \n",
+ "17 A NaN NaN Is \n",
+ "18 A NaN NaN Is \n",
+ "19 A NaN NaN Is \n",
+ "20 A NaN NaN Is \n",
+ "21 A NaN NaN Is \n",
+ "22 AA + AG Pediatric NaN Are \n",
+ "23 AA + AG NaN NaN Are \n",
"\n",
- " Is/Is Not associated Direction of effect PD/PK terms Multiple drugs And/or \\\n",
- "0 Associated with NaN response to NaN \n",
+ " Is/Is Not associated Direction of effect PD/PK terms \\\n",
+ "0 Associated with NaN response to \n",
+ "1 Associated with NaN response to \n",
+ "2 Associated with NaN response to \n",
+ "3 Associated with NaN response to \n",
+ "4 Associated with increased response to \n",
+ "5 Associated with NaN response to \n",
+ "6 Associated with NaN response to \n",
+ "7 Associated with NaN response to \n",
+ "8 Associated with NaN response to \n",
+ "9 Associated with NaN response to \n",
+ "10 Associated with NaN response to \n",
+ "11 Associated with NaN response to \n",
+ "12 Associated with NaN response to \n",
+ "13 Associated with NaN response to \n",
+ "14 Associated with NaN response to \n",
+ "15 Associated with NaN response to \n",
+ "16 Associated with NaN response to \n",
+ "17 Associated with increased response to \n",
+ "18 Associated with increased response to \n",
+ "19 Associated with increased response to \n",
+ "20 Associated with NaN response to \n",
+ "21 Associated with NaN response to \n",
+ "22 Associated with NaN response to \n",
+ "23 Associated with increased response to \n",
"\n",
- " Population types Population Phenotypes or diseases \\\n",
- "0 in people with Disease:Cystic Fibrosis \n",
+ " Multiple drugs And/or Population types Population Phenotypes or diseases \\\n",
+ "0 NaN in people with Disease:Cystic Fibrosis \n",
+ "1 NaN in people with Disease:Cystic Fibrosis \n",
+ "2 NaN in children with Disease:Cystic Fibrosis \n",
+ "3 NaN in women with Disease:Cystic Fibrosis \n",
+ "4 NaN in people with Disease:Cystic Fibrosis \n",
+ "5 NaN in people with Disease:Cystic Fibrosis \n",
+ "6 NaN in people with Disease:Cystic Fibrosis \n",
+ "7 NaN in people with Disease:Cystic Fibrosis \n",
+ "8 NaN in people with Disease:Cystic Fibrosis \n",
+ "9 NaN in people with Disease:Cystic Fibrosis \n",
+ "10 NaN in children with Disease:Cystic Fibrosis \n",
+ "11 NaN in people with Disease:Cystic Fibrosis \n",
+ "12 NaN in people with Disease:Cystic Fibrosis \n",
+ "13 NaN in people with Disease:Cystic Fibrosis \n",
+ "14 NaN in people with Disease:Cystic Fibrosis \n",
+ "15 NaN in children with Disease:Cystic Fibrosis \n",
+ "16 NaN in people with Disease:Cystic Fibrosis \n",
+ "17 NaN NaN NaN \n",
+ "18 NaN NaN NaN \n",
+ "19 NaN NaN NaN \n",
+ "20 NaN in people with Disease:Cystic Fibrosis \n",
+ "21 NaN in men with Disease:Cystic Fibrosis \n",
+ "22 NaN in people with Disease:Cystic Fibrosis \n",
+ "23 NaN in people with Disease:Cystic Fibrosis \n",
"\n",
- " Multiple phenotypes or diseases And/or Comparison Allele(s) or Genotype(s) \\\n",
- "0 NaN NaN \n",
+ " Multiple phenotypes or diseases And/or Comparison Allele(s) or Genotype(s) \\\n",
+ "0 NaN NaN \n",
+ "1 NaN NaN \n",
+ "2 NaN NaN \n",
+ "3 NaN NaN \n",
+ "4 NaN GG \n",
+ "5 NaN NaN \n",
+ "6 NaN NaN \n",
+ "7 NaN NaN \n",
+ "8 NaN NaN \n",
+ "9 NaN NaN \n",
+ "10 NaN NaN \n",
+ "11 NaN NaN \n",
+ "12 NaN NaN \n",
+ "13 NaN NaN \n",
+ "14 NaN NaN \n",
+ "15 NaN NaN \n",
+ "16 NaN NaN \n",
+ "17 NaN NaN \n",
+ "18 NaN NaN \n",
+ "19 NaN NaN \n",
+ "20 NaN NaN \n",
+ "21 NaN NaN \n",
+ "22 NaN NaN \n",
+ "23 NaN GG \n",
"\n",
- " Comparison Metabolizer types \n",
- "0 NaN "
+ " Comparison Metabolizer types \n",
+ "0 NaN \n",
+ "1 NaN \n",
+ "2 NaN \n",
+ "3 NaN \n",
+ "4 NaN \n",
+ "5 NaN \n",
+ "6 NaN \n",
+ "7 NaN \n",
+ "8 NaN \n",
+ "9 NaN \n",
+ "10 NaN \n",
+ "11 NaN \n",
+ "12 NaN \n",
+ "13 NaN \n",
+ "14 NaN \n",
+ "15 NaN \n",
+ "16 NaN \n",
+ "17 NaN \n",
+ "18 NaN \n",
+ "19 NaN \n",
+ "20 NaN \n",
+ "21 NaN \n",
+ "22 NaN \n",
+ "23 NaN "
]
},
- "execution_count": 206,
+ "execution_count": 248,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
- "df_981755803_drug.head(1)"
+ "df_981755803_drug"
]
},
{
@@ -2178,10 +4094,64 @@
"* Using the additional phenotype annotations (side effect etc.) to disambiguate or supplement the phenotype information we use from the clinical annotation"
]
},
+ {
+ "cell_type": "markdown",
+ "id": "72471a5a-8c7f-4d4c-ae6f-92fa86c13d34",
+ "metadata": {},
+ "source": [
+ "## Post-meeting\n",
+ "\n",
+ "* Get a few representative (?!) examples of annotations\n",
+ "* Join with all variant evidence _and_ all clinical_alleles\n",
+ "* Dump to CSV"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 285,
+ "id": "442da098-f2a2-4436-89a0-e7a4760aad7d",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "# Build a clean table showing everything: start from the clinical annotations and\n",
+ "# left-join the evidence rows, then the allele rows, on the shared ID column.\n",
+ "# NOTE(review): when an ID has several evidence rows and several allele rows, the\n",
+ "# result holds one row per (evidence, allele) pair - confirm this fan-out is intended.\n",
+ "complete_df = (\n",
+ "    clinical_annotations\n",
+ "    .merge(clinical_ann_evidence, how='left', on=ID_COL_NAME)\n",
+ "    .merge(clinical_ann_alleles, how='left', on=ID_COL_NAME)\n",
+ ")"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 286,
+ "id": "dc9116ed-cf4d-4c01-9a2d-f6189a77ee0e",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "def get_annotation_tables_for_ids(ca_ids):\n",
+ "    \"\"\"Collect the variant annotation evidence for the given annotation IDs.\n",
+ "\n",
+ "    Selects the rows of `complete_df` whose `ID_COL_NAME` value is one of `ca_ids`\n",
+ "    (each ID is converted with `str()` before matching), then inner-joins that\n",
+ "    selection to each variant annotation table on\n",
+ "    `Evidence ID` == `Variant Annotation ID`.\n",
+ "\n",
+ "    Columns of a variant annotation table that clash with a column of the selection\n",
+ "    receive that table's suffix (`_var_drug`, `_var_pheno`, `_var_fa`); the\n",
+ "    selection's own column names are left unchanged.\n",
+ "\n",
+ "    :param ca_ids: iterable of IDs to look up in the `ID_COL_NAME` column\n",
+ "        (presumably that column holds strings, hence the `str()` conversion - confirm)\n",
+ "    :return: tuple of three DataFrames, in order the joins with `var_drug_ann`,\n",
+ "        `var_pheno_ann` and `var_fa_ann`\n",
+ "    \"\"\"\n",
+ "    wanted_ids = {str(ca_id) for ca_id in ca_ids}\n",
+ "    selected_rows = complete_df[complete_df[ID_COL_NAME].isin(wanted_ids)]\n",
+ "\n",
+ "    def join_evidence(variant_ann, suffix):\n",
+ "        # Inner join: keep only evidence rows that exist in this annotation table\n",
+ "        return pd.merge(\n",
+ "            selected_rows,\n",
+ "            variant_ann,\n",
+ "            left_on='Evidence ID',\n",
+ "            right_on='Variant Annotation ID',\n",
+ "            how='inner',\n",
+ "            suffixes=(None, suffix),\n",
+ "        )\n",
+ "\n",
+ "    return (\n",
+ "        join_evidence(var_drug_ann, '_var_drug'),\n",
+ "        join_evidence(var_pheno_ann, '_var_pheno'),\n",
+ "        join_evidence(var_fa_ann, '_var_fa'),\n",
+ "    )"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 276,
+ "id": "86bab485-ccf8-426b-9565-01fe35058871",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "# IDs of the annotations exported as examples\n",
+ "example_ca_ids = [\n",
+ "    981755803,\n",
+ "    1139506787,\n",
+ "    1183888969,\n",
+ "    1184514050,\n",
+ "    981419266,\n",
+ "]\n",
+ "\n",
+ "# d, p, f: the joins with var_drug_ann, var_pheno_ann and var_fa_ann respectively\n",
+ "d, p, f = get_annotation_tables_for_ids(example_ca_ids)\n",
+ "\n",
+ "# One CSV per evidence table, written without the DataFrame index column\n",
+ "d.to_csv(path_or_buf=f'{data_dir}/example_drug.csv', index=False)\n",
+ "p.to_csv(path_or_buf=f'{data_dir}/example_pheno.csv', index=False)\n",
+ "f.to_csv(path_or_buf=f'{data_dir}/example_func.csv', index=False)"
+ ]
+ },
{
"cell_type": "code",
"execution_count": null,
- "id": "c60bfd67-58b3-4264-b847-5847f6a14fce",
+ "id": "b4cee848-abf7-422d-9d64-c3c4f66f5242",
"metadata": {},
"outputs": [],
"source": []