diff --git a/api/__init__.py b/api/__init__.py
index b407f4e..8de60d4 100644
--- a/api/__init__.py
+++ b/api/__init__.py
@@ -46,7 +46,7 @@
download_database_for_eys_gene,
# Functions for storing databases
- store_database_for_eys_gene
+ download_selected_database_for_eys_gene
)
# DATA REFACTORING IMPORT
diff --git a/api/data/__init__.py b/api/data/__init__.py
index 7bfdfbe..b2bc9c1 100644
--- a/api/data/__init__.py
+++ b/api/data/__init__.py
@@ -34,7 +34,7 @@
)
# DATA COLLECTION IMPORT
-from .collection import (
+from .downloading import (
# Custom exceptions
BadResponseException,
DownloadError,
@@ -49,7 +49,7 @@
download_data_from_gnomad_eys,
# Functions for storing databases
- store_database_for_eys_gene
+ download_selected_database_for_eys_gene
)
diff --git a/api/data/constants.py b/api/data/constants.py
index 757074c..fa0060f 100644
--- a/api/data/constants.py
+++ b/api/data/constants.py
@@ -8,6 +8,7 @@
LOVD_FILE_URL = "https://databases.lovd.nl/shared/download/all/gene/"
LOVD_FILE_URL_EYS = LOVD_FILE_URL + "EYS"
STORE_AS_LOVD = "../data/lovd/lovd_data.txt"
+STORE_AS_GNOMAD = "../data/gnomad/gnomad_data.csv"
GNOMAD_URL = "https://gnomad.broadinstitute.org/gene"
GNOMAD_URL_EYS = "https://gnomad.broadinstitute.org/gene/ENSG00000188107?dataset=gnomad_r4"
diff --git a/api/data/downloading.py b/api/data/downloading.py
index 5fa786d..c253f14 100644
--- a/api/data/downloading.py
+++ b/api/data/downloading.py
@@ -18,7 +18,8 @@
LOVD_PATH,
DATABASES_DOWNLOAD_PATHS,
LOVD_FILE_URL_EYS,
- STORE_AS_LOVD)
+ STORE_AS_LOVD,
+ STORE_AS_GNOMAD)
# EXCEPTIONS
@@ -176,21 +177,36 @@ def download_database_for_eys_gene(database_name, override=False):
os.rename(latest_file, os_path)
-def store_database_for_eys_gene(database_name, override=False):
+def download_selected_database_for_eys_gene(database_name, save_path="", override=False):
"""
Calls a function to download a database.
+
:param database_name: the name of the database that should be downloaded
+ :param save_path: path to save the data; if empty, the default location for the selected database is used
:param override: should be already existing file be overwritten
"""
+ if not isinstance(database_name, str):
+ raise TypeError("Database name should be a string")
+
database_name = database_name.lower()
+
+ # if save_path is not provided, save to default location
+ if database_name == "lovd" and save_path == "":
+ save_path = STORE_AS_LOVD
+ elif database_name == "gnomad" and save_path == "":
+ save_path = STORE_AS_GNOMAD
+
+ # check if database_name is supported
if database_name not in DATABASES_DOWNLOAD_PATHS:
- raise IndexError(f"Requested {database_name} database is not supported")
+ raise IndexError(f"Requested for {database_name} database is not supported")
+
+ # download the database
if database_name == "lovd":
- download_lovd_database_for_eys_gene(database_name, override)
+ download_lovd_database_for_eys_gene(save_path, override)
elif database_name == "gnomad":
- download_data_from_gnomad_eys(database_name, override)
+ download_data_from_gnomad_eys(save_path, override)
else:
- download_database_for_eys_gene(database_name, override)
+ raise IndexError(f"Requested for {database_name} is not yet supported")
def prepare_popmax_calculation(df, pop_data, name, pop_ids, index):
@@ -215,7 +231,7 @@ def prepare_popmax_calculation(df, pop_data, name, pop_ids, index):
df.loc[index, f'{name}_an_{variant_id}'] = pop['an']
-def download_data_from_gnomad_eys(path, override=False):
+def download_data_from_gnomad_eys(path=STORE_AS_GNOMAD, override=False):
"""
Requests gnomAD API for data about a specific gene containing:
- variant_id
@@ -226,10 +242,8 @@ def download_data_from_gnomad_eys(path, override=False):
- popmax
- popmax population
- :param str gene_name: name of gene
- :param bool to_file: if True, saves data to variants.csv
- :returns: DataFrame from gnomAD API
- :rtype: DataFrame
+ :param str path: path to save the data (default: STORE_AS_GNOMAD, '../data/gnomad/gnomad_data.csv')
+ :param bool override: whether an existing file should be overwritten with a new one
"""
if os.path.exists(path) and not override:
@@ -347,6 +361,4 @@ def download_data_from_gnomad_eys(path, override=False):
df = df.filter(not_to_drop, axis="columns")
if not os.path.isfile(path) or override:
- df.to_csv(path, index=False)
-
- return df
\ No newline at end of file
+ df.to_csv(path, index=False)
\ No newline at end of file
diff --git a/tests/pipeline2.ipynb b/tests/pipeline2.ipynb
new file mode 100644
index 0000000..4e459ea
--- /dev/null
+++ b/tests/pipeline2.ipynb
@@ -0,0 +1,4089 @@
+{
+ "cells": [
+ {
+ "cell_type": "code",
+ "id": "initial_id",
+ "metadata": {
+ "collapsed": true,
+ "jupyter": {
+ "outputs_hidden": true
+ },
+ "ExecuteTime": {
+ "end_time": "2024-09-26T20:31:26.514394Z",
+ "start_time": "2024-09-26T20:31:25.176141Z"
+ }
+ },
+ "source": [
+ "import pandas as pd\n",
+ "\n",
+ "from api.data import (download_selected_database_for_eys_gene,\n",
+ " parse_lovd,\n",
+ " LOVD_PATH,\n",
+ " set_lovd_dtypes)\n",
+ "from api.data import save_lovd_as_vcf\n",
+ "pd.options.display.max_columns = 0"
+ ],
+ "outputs": [],
+ "execution_count": 1
+ },
+ {
+ "cell_type": "code",
+ "id": "f49f7691a27aa7b4",
+ "metadata": {
+ "collapsed": false,
+ "ExecuteTime": {
+ "end_time": "2024-09-26T20:35:18.191483Z",
+ "start_time": "2024-09-26T20:32:53.778757Z"
+ }
+ },
+ "source": "download_selected_database_for_eys_gene(\"gnomad\", save_path=\"../data/gnomad/gnomad_data_text.csv\", override=False)",
+ "outputs": [],
+ "execution_count": 3
+ },
+ {
+ "metadata": {
+ "ExecuteTime": {
+ "end_time": "2024-09-26T20:36:09.300943Z",
+ "start_time": "2024-09-26T20:36:08.947865Z"
+ }
+ },
+ "cell_type": "code",
+ "source": "download_selected_database_for_eys_gene(\"lovd\", save_path=\"../data/lovd/lovd_data_text.txt\", override=False)",
+ "id": "75f1962c219b6348",
+ "outputs": [],
+ "execution_count": 5
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 2,
+ "id": "cf5c45c0f7b9de0f",
+ "metadata": {
+ "ExecuteTime": {
+ "end_time": "2024-05-13T15:38:24.591752Z",
+ "start_time": "2024-05-13T15:38:19.498594Z"
+ },
+ "collapsed": false
+ },
+ "outputs": [],
+ "source": [
+ "data = parse_lovd(LOVD_PATH + \"/lovd_data.txt\")"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 8,
+ "id": "8a089e29bfc8c119",
+ "metadata": {
+ "ExecuteTime": {
+ "end_time": "2024-05-13T15:12:07.510712Z",
+ "start_time": "2024-05-13T15:12:07.366319Z"
+ }
+ },
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Genes\n"
+ ]
+ },
+ {
+ "data": {
+ "text/html": [
+ "
\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " id | \n",
+ " name | \n",
+ " chromosome | \n",
+ " chrom_band | \n",
+ " imprinting | \n",
+ " refseq_genomic | \n",
+ " refseq_UD | \n",
+ " reference | \n",
+ " url_homepage | \n",
+ " url_external | \n",
+ " allow_download | \n",
+ " id_hgnc | \n",
+ " id_entrez | \n",
+ " id_omim | \n",
+ " show_hgmd | \n",
+ " show_genecards | \n",
+ " show_genetests | \n",
+ " show_orphanet | \n",
+ " note_index | \n",
+ " note_listing | \n",
+ " refseq | \n",
+ " refseq_url | \n",
+ " disclaimer | \n",
+ " disclaimer_text | \n",
+ " header | \n",
+ " header_align | \n",
+ " footer | \n",
+ " footer_align | \n",
+ " created_by | \n",
+ " created_date | \n",
+ " edited_by | \n",
+ " edited_date | \n",
+ " updated_by | \n",
+ " updated_date | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " EYS | \n",
+ " eyes shut homolog (Drosophila) | \n",
+ " 6 | \n",
+ " q12 | \n",
+ " unknown | \n",
+ " NG_023443.2 | \n",
+ " UD_132085377375 | \n",
+ " | \n",
+ " http://www.LOVD.nl/EYS | \n",
+ " | \n",
+ " NaN | \n",
+ " 21555 | \n",
+ " 346007 | \n",
+ " 612424 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " <font color=\\\"#FF0000\\\">This database is one o... | \n",
+ " | \n",
+ " g | \n",
+ " http://databases.lovd.nl/shared/refseq/EYS_NM_... | \n",
+ " NaN | \n",
+ " | \n",
+ " <font color=\\\"#FF0000\\\">This database is one o... | \n",
+ " -1 | \n",
+ " | \n",
+ " -1 | \n",
+ " 1 | \n",
+ " 2012-02-13 | \n",
+ " 6 | \n",
+ " 2023-08-30 13:08:19 | \n",
+ " 0 | \n",
+ " 2024-04-19 20:27:30 | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ " id name ... updated_by updated_date\n",
+ "0 EYS eyes shut homolog (Drosophila) ... 0 2024-04-19 20:27:30\n",
+ "\n",
+ "[1 rows x 34 columns]"
+ ]
+ },
+ "metadata": {},
+ "output_type": "display_data"
+ },
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Transcripts\n"
+ ]
+ },
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " id | \n",
+ " geneid | \n",
+ " name | \n",
+ " id_mutalyzer | \n",
+ " id_ncbi | \n",
+ " id_ensembl | \n",
+ " id_protein_ncbi | \n",
+ " id_protein_ensembl | \n",
+ " id_protein_uniprot | \n",
+ " remarks | \n",
+ " position_c_mrna_start | \n",
+ " position_c_mrna_end | \n",
+ " position_c_cds_end | \n",
+ " position_g_mrna_start | \n",
+ " position_g_mrna_end | \n",
+ " created_by | \n",
+ " created_date | \n",
+ " edited_by | \n",
+ " edited_date | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " 7329 | \n",
+ " EYS | \n",
+ " transcript variant 1 | \n",
+ " 1 | \n",
+ " NM_001142800.1 | \n",
+ " | \n",
+ " NP_001136272.1 | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " -538 | \n",
+ " 10051 | \n",
+ " 9435 | \n",
+ " 66417118 | \n",
+ " 64429876 | \n",
+ " <NA> | \n",
+ " NaT | \n",
+ " <NA> | \n",
+ " NaT | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ " id geneid name ... created_date edited_by edited_date\n",
+ "0 7329 EYS transcript variant 1 ... NaT NaT\n",
+ "\n",
+ "[1 rows x 19 columns]"
+ ]
+ },
+ "metadata": {},
+ "output_type": "display_data"
+ },
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Diseases\n"
+ ]
+ },
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " id | \n",
+ " symbol | \n",
+ " name | \n",
+ " inheritance | \n",
+ " id_omim | \n",
+ " tissues | \n",
+ " features | \n",
+ " remarks | \n",
+ " created_by | \n",
+ " created_date | \n",
+ " edited_by | \n",
+ " edited_date | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " 12 | \n",
+ " PSORS | \n",
+ " psoriasis, pustular, generalized (PSORS) | \n",
+ " | \n",
+ " <NA> | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " 6 | \n",
+ " 2012-07-06 21:50:32 | \n",
+ " 6 | \n",
+ " 2019-08-12 13:38:21 | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " 58 | \n",
+ " CORD | \n",
+ " dystrophy, cone-rod (CORD) | \n",
+ " | \n",
+ " <NA> | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " 6 | \n",
+ " 2012-09-22 11:31:25 | \n",
+ " 6 | \n",
+ " 2020-08-30 09:43:59 | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " 112 | \n",
+ " RP | \n",
+ " retinitis pigmentosa (RP) | \n",
+ " | \n",
+ " 268000 | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " 1 | \n",
+ " 2013-02-21 17:12:36 | \n",
+ " 6 | \n",
+ " 2021-01-18 09:53:26 | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " 139 | \n",
+ " ID | \n",
+ " intellectual disability (ID) | \n",
+ " | \n",
+ " <NA> | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " 84 | \n",
+ " 2013-06-04 18:18:07 | \n",
+ " 6 | \n",
+ " 2015-02-09 10:02:49 | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " 173 | \n",
+ " SLOS | \n",
+ " Smith-Lemli-Opitz syndrome (SLOS) | \n",
+ " AR | \n",
+ " 270400 | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " 6 | \n",
+ " 2013-08-01 11:16:14 | \n",
+ " 6 | \n",
+ " 2021-12-10 21:51:32 | \n",
+ "
\n",
+ " \n",
+ " 5 | \n",
+ " 198 | \n",
+ " ? | \n",
+ " unclassified / mixed | \n",
+ " | \n",
+ " <NA> | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " 6 | \n",
+ " 2013-09-13 14:21:47 | \n",
+ " 6 | \n",
+ " 2016-10-22 17:54:40 | \n",
+ "
\n",
+ " \n",
+ " 6 | \n",
+ " 2156 | \n",
+ " - | \n",
+ " retinitis pigmentosa, X-linked, and sinorespir... | \n",
+ " | \n",
+ " 300455 | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " 6 | \n",
+ " 2014-09-25 23:29:40 | \n",
+ " 6 | \n",
+ " 2021-12-10 21:51:32 | \n",
+ "
\n",
+ " \n",
+ " 7 | \n",
+ " 2440 | \n",
+ " RP25 | \n",
+ " retinitis pigmentosa, type 25 (RP25) | \n",
+ " AR | \n",
+ " 602772 | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " 6 | \n",
+ " 2014-09-25 23:29:40 | \n",
+ " 6 | \n",
+ " 2021-12-10 21:51:32 | \n",
+ "
\n",
+ " \n",
+ " 8 | \n",
+ " 4211 | \n",
+ " RPar | \n",
+ " retinitis pigmentosa, autosomal recessive (RPar) | \n",
+ " | \n",
+ " <NA> | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " 6 | \n",
+ " 2015-02-27 18:58:57 | \n",
+ " <NA> | \n",
+ " NaT | \n",
+ "
\n",
+ " \n",
+ " 9 | \n",
+ " 4214 | \n",
+ " - | \n",
+ " retinal disease | \n",
+ " | \n",
+ " <NA> | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " 6 | \n",
+ " 2015-02-27 19:48:07 | \n",
+ " 1 | \n",
+ " 2023-03-09 14:26:26 | \n",
+ "
\n",
+ " \n",
+ " 10 | \n",
+ " 4249 | \n",
+ " macular dystrophy | \n",
+ " dystrophy, macular | \n",
+ " | \n",
+ " <NA> | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " 6 | \n",
+ " 2015-05-04 22:10:58 | \n",
+ " 6 | \n",
+ " 2024-02-15 21:18:39 | \n",
+ "
\n",
+ " \n",
+ " 11 | \n",
+ " 5086 | \n",
+ " HL | \n",
+ " hearing loss (HL) | \n",
+ " | \n",
+ " <NA> | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " 6 | \n",
+ " 2015-10-23 11:41:05 | \n",
+ " 6 | \n",
+ " 2015-10-23 11:43:00 | \n",
+ "
\n",
+ " \n",
+ " 12 | \n",
+ " 5415 | \n",
+ " USH | \n",
+ " Usher syndrome (USH) | \n",
+ " | \n",
+ " <NA> | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " 6 | \n",
+ " 2018-04-02 16:40:44 | \n",
+ " <NA> | \n",
+ " NaT | \n",
+ "
\n",
+ " \n",
+ " 13 | \n",
+ " 5468 | \n",
+ " uveitis | \n",
+ " uveitis | \n",
+ " | \n",
+ " <NA> | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " 6 | \n",
+ " 2018-08-22 09:47:04 | \n",
+ " <NA> | \n",
+ " NaT | \n",
+ "
\n",
+ " \n",
+ " 14 | \n",
+ " 6906 | \n",
+ " DEE | \n",
+ " encephalopathy, developmental and epileptic | \n",
+ " | \n",
+ " <NA> | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " 6 | \n",
+ " 2022-04-07 09:24:23 | \n",
+ " <NA> | \n",
+ " NaT | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ " id symbol ... edited_by edited_date\n",
+ "0 12 PSORS ... 6 2019-08-12 13:38:21\n",
+ "1 58 CORD ... 6 2020-08-30 09:43:59\n",
+ "2 112 RP ... 6 2021-01-18 09:53:26\n",
+ "3 139 ID ... 6 2015-02-09 10:02:49\n",
+ "4 173 SLOS ... 6 2021-12-10 21:51:32\n",
+ "5 198 ? ... 6 2016-10-22 17:54:40\n",
+ "6 2156 - ... 6 2021-12-10 21:51:32\n",
+ "7 2440 RP25 ... 6 2021-12-10 21:51:32\n",
+ "8 4211 RPar ... NaT\n",
+ "9 4214 - ... 1 2023-03-09 14:26:26\n",
+ "10 4249 macular dystrophy ... 6 2024-02-15 21:18:39\n",
+ "11 5086 HL ... 6 2015-10-23 11:43:00\n",
+ "12 5415 USH ... NaT\n",
+ "13 5468 uveitis ... NaT\n",
+ "14 6906 DEE ... NaT\n",
+ "\n",
+ "[15 rows x 12 columns]"
+ ]
+ },
+ "metadata": {},
+ "output_type": "display_data"
+ },
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Genes_To_Diseases\n"
+ ]
+ },
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " geneid | \n",
+ " diseaseid | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " EYS | \n",
+ " 112 | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " EYS | \n",
+ " 2440 | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ " geneid diseaseid\n",
+ "0 EYS 112\n",
+ "1 EYS 2440"
+ ]
+ },
+ "metadata": {},
+ "output_type": "display_data"
+ },
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Individuals\n"
+ ]
+ },
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " id | \n",
+ " fatherid | \n",
+ " motherid | \n",
+ " panelid | \n",
+ " panel_size | \n",
+ " license | \n",
+ " owned_by | \n",
+ " Individual/Reference | \n",
+ " Individual/Remarks | \n",
+ " Individual/Gender | \n",
+ " Individual/Consanguinity | \n",
+ " Individual/Origin/Geographic | \n",
+ " Individual/Age_of_death | \n",
+ " Individual/VIP | \n",
+ " Individual/Data_av | \n",
+ " Individual/Treatment | \n",
+ " Individual/Origin/Population | \n",
+ " Individual/Individual_ID | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " 135 | \n",
+ " | \n",
+ " | \n",
+ " <NA> | \n",
+ " 3 | \n",
+ " | \n",
+ " 6 | \n",
+ " {PMID:Marrakchi 2011:21848462} | \n",
+ " 5-generation family, 3 affecteds (M) | \n",
+ " M | \n",
+ " yes | \n",
+ " Tunisia | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " 210 | \n",
+ " | \n",
+ " | \n",
+ " <NA> | \n",
+ " 1 | \n",
+ " | \n",
+ " 39 | \n",
+ " {PMID:Abu-Safieh-2013:23105016} | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " (Saudi Arabia) | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " 1962 | \n",
+ " | \n",
+ " | \n",
+ " <NA> | \n",
+ " 1 | \n",
+ " | \n",
+ " 25 | \n",
+ " | \n",
+ " | \n",
+ " M | \n",
+ " ? | \n",
+ " Germany | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " white | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " 16605 | \n",
+ " | \n",
+ " | \n",
+ " <NA> | \n",
+ " 1 | \n",
+ " | \n",
+ " 552 | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " 0 | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " 33096 | \n",
+ " | \n",
+ " | \n",
+ " <NA> | \n",
+ " 1 | \n",
+ " | \n",
+ " 229 | \n",
+ " {PMID:Neveling 2012:22334370} | \n",
+ " | \n",
+ " M | \n",
+ " no | \n",
+ " | \n",
+ " | \n",
+ " 0 | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 1445 | \n",
+ " 447702 | \n",
+ " | \n",
+ " | \n",
+ " <NA> | \n",
+ " 1 | \n",
+ " | \n",
+ " 6 | \n",
+ " {PMID:Weisschuh 2024:37734845} | \n",
+ " patient, no family history | \n",
+ " F | \n",
+ " | \n",
+ " Germany | \n",
+ " | \n",
+ " 0 | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " SRP-1105 | \n",
+ "
\n",
+ " \n",
+ " 1446 | \n",
+ " 447707 | \n",
+ " | \n",
+ " | \n",
+ " <NA> | \n",
+ " 1 | \n",
+ " | \n",
+ " 6 | \n",
+ " {PMID:Weisschuh 2024:37734845} | \n",
+ " patient, no family history | \n",
+ " M | \n",
+ " | \n",
+ " Germany | \n",
+ " | \n",
+ " 0 | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " SRP-1167 | \n",
+ "
\n",
+ " \n",
+ " 1447 | \n",
+ " 447716 | \n",
+ " | \n",
+ " | \n",
+ " <NA> | \n",
+ " 1 | \n",
+ " | \n",
+ " 6 | \n",
+ " {PMID:Weisschuh 2024:37734845} | \n",
+ " patient, no family history | \n",
+ " F | \n",
+ " | \n",
+ " Germany | \n",
+ " | \n",
+ " 0 | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " SRP-1249 | \n",
+ "
\n",
+ " \n",
+ " 1448 | \n",
+ " 447718 | \n",
+ " | \n",
+ " | \n",
+ " <NA> | \n",
+ " 1 | \n",
+ " | \n",
+ " 6 | \n",
+ " {PMID:Weisschuh 2024:37734845} | \n",
+ " patient, no family history | \n",
+ " M | \n",
+ " | \n",
+ " Germany | \n",
+ " | \n",
+ " 0 | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " SRP-1274 | \n",
+ "
\n",
+ " \n",
+ " 1449 | \n",
+ " 447720 | \n",
+ " | \n",
+ " | \n",
+ " <NA> | \n",
+ " 1 | \n",
+ " | \n",
+ " 6 | \n",
+ " {PMID:Weisschuh 2024:37734845} | \n",
+ " patient | \n",
+ " M | \n",
+ " | \n",
+ " Germany | \n",
+ " | \n",
+ " 0 | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " SRP-1299 | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
1450 rows × 18 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " id fatherid ... Individual/Origin/Population Individual/Individual_ID\n",
+ "0 135 ... \n",
+ "1 210 ... \n",
+ "2 1962 ... white \n",
+ "3 16605 ... \n",
+ "4 33096 ... \n",
+ "... ... ... ... ... ...\n",
+ "1445 447702 ... SRP-1105\n",
+ "1446 447707 ... SRP-1167\n",
+ "1447 447716 ... SRP-1249\n",
+ "1448 447718 ... SRP-1274\n",
+ "1449 447720 ... SRP-1299\n",
+ "\n",
+ "[1450 rows x 18 columns]"
+ ]
+ },
+ "metadata": {},
+ "output_type": "display_data"
+ },
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Individuals_To_Diseases\n"
+ ]
+ },
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " individualid | \n",
+ " diseaseid | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " 135 | \n",
+ " 12 | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " 210 | \n",
+ " 58 | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " 1962 | \n",
+ " 173 | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " 33096 | \n",
+ " 4214 | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " 33109 | \n",
+ " 4214 | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 1444 | \n",
+ " 447702 | \n",
+ " 198 | \n",
+ "
\n",
+ " \n",
+ " 1445 | \n",
+ " 447707 | \n",
+ " 198 | \n",
+ "
\n",
+ " \n",
+ " 1446 | \n",
+ " 447716 | \n",
+ " 198 | \n",
+ "
\n",
+ " \n",
+ " 1447 | \n",
+ " 447718 | \n",
+ " 198 | \n",
+ "
\n",
+ " \n",
+ " 1448 | \n",
+ " 447720 | \n",
+ " 198 | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
1449 rows × 2 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " individualid diseaseid\n",
+ "0 135 12\n",
+ "1 210 58\n",
+ "2 1962 173\n",
+ "3 33096 4214\n",
+ "4 33109 4214\n",
+ "... ... ...\n",
+ "1444 447702 198\n",
+ "1445 447707 198\n",
+ "1446 447716 198\n",
+ "1447 447718 198\n",
+ "1448 447720 198\n",
+ "\n",
+ "[1449 rows x 2 columns]"
+ ]
+ },
+ "metadata": {},
+ "output_type": "display_data"
+ },
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Phenotypes\n"
+ ]
+ },
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " id | \n",
+ " diseaseid | \n",
+ " individualid | \n",
+ " owned_by | \n",
+ " Phenotype/Inheritance | \n",
+ " Phenotype/Age | \n",
+ " Phenotype/Additional | \n",
+ " Phenotype/Biochem_param | \n",
+ " Phenotype/Age/Onset | \n",
+ " Phenotype/Age/Diagnosis | \n",
+ " Phenotype/Severity_score | \n",
+ " Phenotype/Onset | \n",
+ " Phenotype/Protein | \n",
+ " Phenotype/Tumor/MSI | \n",
+ " Phenotype/Enzyme/CPK | \n",
+ " Phenotype/Heart/Myocardium | \n",
+ " Phenotype/Lung | \n",
+ " Phenotype/Diagnosis/Definite | \n",
+ " Phenotype/Diagnosis/Initial | \n",
+ " Phenotype/Diagnosis/Criteria | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " 8 | \n",
+ " 12 | \n",
+ " 135 | \n",
+ " 6 | \n",
+ " Familial, autosomal recessive | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " 26 | \n",
+ " 58 | \n",
+ " 210 | \n",
+ " 39 | \n",
+ " Familial, autosomal recessive | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " 941 | \n",
+ " 173 | \n",
+ " 1962 | \n",
+ " 25 | \n",
+ " Familial | \n",
+ " | \n",
+ " 2-3 toe syndactyly | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " 5 | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " 26525 | \n",
+ " 4214 | \n",
+ " 33096 | \n",
+ " 229 | \n",
+ " Unknown | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " retinitis pigmentosa | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " 26538 | \n",
+ " 4214 | \n",
+ " 33109 | \n",
+ " 229 | \n",
+ " Unknown | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " retinitis pigmentosa | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 1266 | \n",
+ " 336901 | \n",
+ " 198 | \n",
+ " 447702 | \n",
+ " 6 | \n",
+ " Unknown | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " retinitis pigmentosa, simplex | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 1267 | \n",
+ " 336906 | \n",
+ " 198 | \n",
+ " 447707 | \n",
+ " 6 | \n",
+ " Unknown | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " retinitis pigmentosa, simplex | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 1268 | \n",
+ " 336915 | \n",
+ " 198 | \n",
+ " 447716 | \n",
+ " 6 | \n",
+ " Unknown | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " retinitis pigmentosa, simplex | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 1269 | \n",
+ " 336917 | \n",
+ " 198 | \n",
+ " 447718 | \n",
+ " 6 | \n",
+ " Unknown | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " retinitis pigmentosa, simplex | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 1270 | \n",
+ " 336919 | \n",
+ " 198 | \n",
+ " 447720 | \n",
+ " 6 | \n",
+ " Unknown | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " retinitis pigmentosa, simplex | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
1271 rows × 20 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " id ... Phenotype/Diagnosis/Criteria\n",
+ "0 8 ... \n",
+ "1 26 ... \n",
+ "2 941 ... \n",
+ "3 26525 ... \n",
+ "4 26538 ... \n",
+ "... ... ... ...\n",
+ "1266 336901 ... \n",
+ "1267 336906 ... \n",
+ "1268 336915 ... \n",
+ "1269 336917 ... \n",
+ "1270 336919 ... \n",
+ "\n",
+ "[1271 rows x 20 columns]"
+ ]
+ },
+ "metadata": {},
+ "output_type": "display_data"
+ },
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Screenings\n"
+ ]
+ },
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " id | \n",
+ " individualid | \n",
+ " variants_found | \n",
+ " owned_by | \n",
+ " created_by | \n",
+ " created_date | \n",
+ " edited_by | \n",
+ " edited_date | \n",
+ " Screening/Technique | \n",
+ " Screening/Template | \n",
+ " Screening/Tissue | \n",
+ " Screening/Remarks | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " 126 | \n",
+ " 135 | \n",
+ " 1 | \n",
+ " 6 | \n",
+ " 6 | \n",
+ " 2012-07-07 19:04:19 | \n",
+ " 6 | \n",
+ " 2012-07-07 19:12:08 | \n",
+ " RT-PCR;SEQ | \n",
+ " DNA;RNA | \n",
+ " | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " 211 | \n",
+ " 210 | \n",
+ " 1 | \n",
+ " 39 | \n",
+ " 6 | \n",
+ " 2012-09-22 11:36:24 | \n",
+ " <NA> | \n",
+ " NaT | \n",
+ " SEQ | \n",
+ " DNA | \n",
+ " | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " 1640 | \n",
+ " 1962 | \n",
+ " 1 | \n",
+ " 25 | \n",
+ " 6 | \n",
+ " 2010-03-11 16:36:41 | \n",
+ " 25 | \n",
+ " 2012-04-13 15:18:00 | \n",
+ " SEQ | \n",
+ " DNA | \n",
+ " | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " 16557 | \n",
+ " 16605 | \n",
+ " 1 | \n",
+ " 552 | \n",
+ " 552 | \n",
+ " 2014-05-23 13:12:43 | \n",
+ " <NA> | \n",
+ " NaT | \n",
+ " SEQ-NG-I | \n",
+ " DNA | \n",
+ " | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " 33164 | \n",
+ " 33096 | \n",
+ " 1 | \n",
+ " 229 | \n",
+ " 229 | \n",
+ " 2012-02-04 15:20:01 | \n",
+ " 6 | \n",
+ " 2012-05-18 13:59:33 | \n",
+ " SEQ;SEQ-NG-S | \n",
+ " DNA | \n",
+ " | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 1445 | \n",
+ " 449279 | \n",
+ " 447702 | \n",
+ " 1 | \n",
+ " 6 | \n",
+ " 6 | \n",
+ " 2024-01-26 10:23:59 | \n",
+ " <NA> | \n",
+ " NaT | \n",
+ " SEQ-NG | \n",
+ " DNA | \n",
+ " | \n",
+ " WGS | \n",
+ "
\n",
+ " \n",
+ " 1446 | \n",
+ " 449284 | \n",
+ " 447707 | \n",
+ " 1 | \n",
+ " 6 | \n",
+ " 6 | \n",
+ " 2024-01-26 10:23:59 | \n",
+ " <NA> | \n",
+ " NaT | \n",
+ " SEQ-NG | \n",
+ " DNA | \n",
+ " | \n",
+ " WGS | \n",
+ "
\n",
+ " \n",
+ " 1447 | \n",
+ " 449293 | \n",
+ " 447716 | \n",
+ " 1 | \n",
+ " 6 | \n",
+ " 6 | \n",
+ " 2024-01-26 10:23:59 | \n",
+ " <NA> | \n",
+ " NaT | \n",
+ " SEQ-NG | \n",
+ " DNA | \n",
+ " | \n",
+ " WGS | \n",
+ "
\n",
+ " \n",
+ " 1448 | \n",
+ " 449295 | \n",
+ " 447718 | \n",
+ " 1 | \n",
+ " 6 | \n",
+ " 6 | \n",
+ " 2024-01-26 10:23:59 | \n",
+ " <NA> | \n",
+ " NaT | \n",
+ " SEQ-NG | \n",
+ " DNA | \n",
+ " | \n",
+ " WGS | \n",
+ "
\n",
+ " \n",
+ " 1449 | \n",
+ " 449297 | \n",
+ " 447720 | \n",
+ " 1 | \n",
+ " 6 | \n",
+ " 6 | \n",
+ " 2024-01-26 10:23:59 | \n",
+ " <NA> | \n",
+ " NaT | \n",
+ " SEQ-NG | \n",
+ " DNA | \n",
+ " | \n",
+ " WGS | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
1450 rows × 12 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " id individualid ... Screening/Tissue Screening/Remarks\n",
+ "0 126 135 ... \n",
+ "1 211 210 ... \n",
+ "2 1640 1962 ... \n",
+ "3 16557 16605 ... \n",
+ "4 33164 33096 ... \n",
+ "... ... ... ... ... ...\n",
+ "1445 449279 447702 ... WGS\n",
+ "1446 449284 447707 ... WGS\n",
+ "1447 449293 447716 ... WGS\n",
+ "1448 449295 447718 ... WGS\n",
+ "1449 449297 447720 ... WGS\n",
+ "\n",
+ "[1450 rows x 12 columns]"
+ ]
+ },
+ "metadata": {},
+ "output_type": "display_data"
+ },
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Screenings_To_Genes\n"
+ ]
+ },
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " screeningid | \n",
+ " geneid | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " 126 | \n",
+ " IL36RN | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " 211 | \n",
+ " MKS1 | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " 1640 | \n",
+ " DHCR7 | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " 33164 | \n",
+ " AHI1 | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " 33164 | \n",
+ " EYS | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 1311 | \n",
+ " 437646 | \n",
+ " EYS | \n",
+ "
\n",
+ " \n",
+ " 1312 | \n",
+ " 437902 | \n",
+ " EYS | \n",
+ "
\n",
+ " \n",
+ " 1313 | \n",
+ " 437922 | \n",
+ " EYS | \n",
+ "
\n",
+ " \n",
+ " 1314 | \n",
+ " 443144 | \n",
+ " EYS | \n",
+ "
\n",
+ " \n",
+ " 1315 | \n",
+ " 443145 | \n",
+ " EYS | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
1316 rows × 2 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " screeningid geneid\n",
+ "0 126 IL36RN\n",
+ "1 211 MKS1\n",
+ "2 1640 DHCR7\n",
+ "3 33164 AHI1\n",
+ "4 33164 EYS\n",
+ "... ... ...\n",
+ "1311 437646 EYS\n",
+ "1312 437902 EYS\n",
+ "1313 437922 EYS\n",
+ "1314 443144 EYS\n",
+ "1315 443145 EYS\n",
+ "\n",
+ "[1316 rows x 2 columns]"
+ ]
+ },
+ "metadata": {},
+ "output_type": "display_data"
+ },
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Variants_On_Genome\n"
+ ]
+ },
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " id | \n",
+ " allele | \n",
+ " effectid | \n",
+ " chromosome | \n",
+ " position_g_start | \n",
+ " position_g_end | \n",
+ " type | \n",
+ " average_frequency | \n",
+ " owned_by | \n",
+ " VariantOnGenome/DBID | \n",
+ " VariantOnGenome/DNA | \n",
+ " VariantOnGenome/Frequency | \n",
+ " VariantOnGenome/Reference | \n",
+ " VariantOnGenome/Restriction_site | \n",
+ " VariantOnGenome/Published_as | \n",
+ " VariantOnGenome/Remarks | \n",
+ " VariantOnGenome/Genetic_origin | \n",
+ " VariantOnGenome/Segregation | \n",
+ " VariantOnGenome/dbSNP | \n",
+ " VariantOnGenome/VIP | \n",
+ " VariantOnGenome/Methylation | \n",
+ " VariantOnGenome/ISCN | \n",
+ " VariantOnGenome/DNA/hg38 | \n",
+ " VariantOnGenome/ClinVar | \n",
+ " VariantOnGenome/ClinicalClassification | \n",
+ " VariantOnGenome/ClinicalClassification/Method | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " 36426 | \n",
+ " 3 | \n",
+ " 50 | \n",
+ " 6 | \n",
+ " 64498971 | \n",
+ " 64498971 | \n",
+ " subst | \n",
+ " 0.000743 | \n",
+ " 552 | \n",
+ " EYS_000007 | \n",
+ " g.64498971A>G | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " Germline | \n",
+ " | \n",
+ " | \n",
+ " 0 | \n",
+ " | \n",
+ " | \n",
+ " g.63789078A>G | \n",
+ " | \n",
+ " VUS | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " 59881 | \n",
+ " 3 | \n",
+ " 55 | \n",
+ " 6 | \n",
+ " 65655758 | \n",
+ " 65655758 | \n",
+ " subst | \n",
+ " 0.001153 | \n",
+ " 229 | \n",
+ " EYS_000001 | \n",
+ " g.65655758T>G | \n",
+ " ExAC: 60, 19750, 0, 0.003038 | \n",
+ " {PMID:Neveling 2012:22334370} | \n",
+ " | \n",
+ " Q770P | \n",
+ " | \n",
+ " Germline | \n",
+ " yes | \n",
+ " | \n",
+ " 0 | \n",
+ " | \n",
+ " | \n",
+ " g.64945865T>G | \n",
+ " | \n",
+ " VUS | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " 59883 | \n",
+ " 1 | \n",
+ " 11 | \n",
+ " 6 | \n",
+ " 65336143 | \n",
+ " 65336143 | \n",
+ " subst | \n",
+ " 0.224189 | \n",
+ " 229 | \n",
+ " EYS_000002 | \n",
+ " g.65336143G>A | \n",
+ " ExAC: 3936, 19366, 441, 0.2032 | \n",
+ " {PMID:Neveling 2012:22334370} | \n",
+ " | \n",
+ " p.? | \n",
+ " unaffected brother also this variant homozygous | \n",
+ " Germline | \n",
+ " no | \n",
+ " | \n",
+ " 0 | \n",
+ " | \n",
+ " | \n",
+ " g.64626250G>A | \n",
+ " | \n",
+ " benign | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " 59884 | \n",
+ " 1 | \n",
+ " 15 | \n",
+ " 6 | \n",
+ " 65300869 | \n",
+ " 65300869 | \n",
+ " subst | \n",
+ " 0.000838 | \n",
+ " 229 | \n",
+ " EYS_000003 | \n",
+ " g.65300869G>A | \n",
+ " ExAC: 12, 19406, 0, 0.0006184 | \n",
+ " {PMID:Neveling 2012:22334370} | \n",
+ " | \n",
+ " (P1631S) | \n",
+ " predicted benign, disease-related variant in o... | \n",
+ " Germline | \n",
+ " | \n",
+ " | \n",
+ " 0 | \n",
+ " | \n",
+ " | \n",
+ " g.64590976G>A | \n",
+ " | \n",
+ " benign | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " 59885 | \n",
+ " 1 | \n",
+ " 11 | \n",
+ " 6 | \n",
+ " 65016998 | \n",
+ " 65016999 | \n",
+ " del | \n",
+ " 0.000000 | \n",
+ " 229 | \n",
+ " EYS_000004 | \n",
+ " g.65016998_65016999del | \n",
+ " ExAC: 9866, 18292, 921, 0.5394 | \n",
+ " {PMID:Neveling 2012:22334370} | \n",
+ " | \n",
+ " 6045-4_6045-3del | \n",
+ " predicted benign | \n",
+ " Germline | \n",
+ " yes | \n",
+ " | \n",
+ " 0 | \n",
+ " | \n",
+ " | \n",
+ " g.64307105_64307106del | \n",
+ " | \n",
+ " benign | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 2536 | \n",
+ " 964211 | \n",
+ " 0 | \n",
+ " 30 | \n",
+ " 6 | \n",
+ " 65767634 | \n",
+ " 65767634 | \n",
+ " subst | \n",
+ " 0.243022 | \n",
+ " 2330 | \n",
+ " EYS_000248 | \n",
+ " g.65767634G>A | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " EYS(NM_001292009.2):c.2024-15_2024-14delTCinsTT | \n",
+ " VKGL data sharing initiative Nederland | \n",
+ " CLASSIFICATION record | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " likely benign | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 2537 | \n",
+ " 964212 | \n",
+ " 0 | \n",
+ " 30 | \n",
+ " 6 | \n",
+ " 65767643 | \n",
+ " 65767643 | \n",
+ " del | \n",
+ " 0.000000 | \n",
+ " 2330 | \n",
+ " EYS_000926 | \n",
+ " g.65767643del | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " EYS(NM_001292009.2):c.2024-15delT | \n",
+ " VKGL data sharing initiative Nederland | \n",
+ " CLASSIFICATION record | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " likely benign | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 2538 | \n",
+ " 964215 | \n",
+ " 0 | \n",
+ " 50 | \n",
+ " 6 | \n",
+ " 66005927 | \n",
+ " 66005927 | \n",
+ " subst | \n",
+ " 0.000112 | \n",
+ " 2327 | \n",
+ " EYS_000253 | \n",
+ " g.66005927C>T | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " EYS(NM_001142800.1):c.1852G>A (p.G618S), EYS(N... | \n",
+ " VKGL data sharing initiative Nederland | \n",
+ " CLASSIFICATION record | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " VUS | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 2539 | \n",
+ " 964216 | \n",
+ " 0 | \n",
+ " 50 | \n",
+ " 6 | \n",
+ " 66044874 | \n",
+ " 66044874 | \n",
+ " subst | \n",
+ " 0.000082 | \n",
+ " 2327 | \n",
+ " EYS_000256 | \n",
+ " g.66044874T>C | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " EYS(NM_001292009.2):c.1765A>G (p.R589G) | \n",
+ " VKGL data sharing initiative Nederland | \n",
+ " CLASSIFICATION record | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " VUS | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 2540 | \n",
+ " 977314 | \n",
+ " 0 | \n",
+ " 90 | \n",
+ " 6 | \n",
+ " 64430943 | \n",
+ " 64430943 | \n",
+ " subst | \n",
+ " 0.000007 | \n",
+ " 1804 | \n",
+ " EYS_000060 | \n",
+ " g.64430943A>T | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " EYS(NM_001142800.2):c.8984T>A (p.(Ile2995Asn))... | \n",
+ " VKGL data sharing initiative Nederland | \n",
+ " CLASSIFICATION record | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " | \n",
+ " pathogenic | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
2541 rows × 26 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " id ... VariantOnGenome/ClinicalClassification/Method\n",
+ "0 36426 ... \n",
+ "1 59881 ... \n",
+ "2 59883 ... \n",
+ "3 59884 ... \n",
+ "4 59885 ... \n",
+ "... ... ... ...\n",
+ "2536 964211 ... \n",
+ "2537 964212 ... \n",
+ "2538 964215 ... \n",
+ "2539 964216 ... \n",
+ "2540 977314 ... \n",
+ "\n",
+ "[2541 rows x 26 columns]"
+ ]
+ },
+ "metadata": {},
+ "output_type": "display_data"
+ },
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Variants_On_Transcripts\n"
+ ]
+ },
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " id | \n",
+ " transcriptid | \n",
+ " effectid | \n",
+ " position_c_start | \n",
+ " position_c_start_intron | \n",
+ " position_c_end | \n",
+ " position_c_end_intron | \n",
+ " VariantOnTranscript/DNA | \n",
+ " VariantOnTranscript/RNA | \n",
+ " VariantOnTranscript/Protein | \n",
+ " VariantOnTranscript/Exon | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " 36426 | \n",
+ " 7329 | \n",
+ " 50 | \n",
+ " 7558 | \n",
+ " 0 | \n",
+ " 7558 | \n",
+ " 0 | \n",
+ " c.7558T>C | \n",
+ " r.(?) | \n",
+ " p.(Phe2520Leu) | \n",
+ " 38 | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " 59881 | \n",
+ " 7329 | \n",
+ " 55 | \n",
+ " 2309 | \n",
+ " 0 | \n",
+ " 2309 | \n",
+ " 0 | \n",
+ " c.2309A>C | \n",
+ " r.(?) | \n",
+ " p.(Gln770Pro) | \n",
+ " 15 | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " 59883 | \n",
+ " 7329 | \n",
+ " 11 | \n",
+ " 3444 | \n",
+ " -5 | \n",
+ " 3444 | \n",
+ " -5 | \n",
+ " c.3444-5C>T | \n",
+ " r.(?) | \n",
+ " p.(=) | \n",
+ " 22i | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " 59884 | \n",
+ " 7329 | \n",
+ " 15 | \n",
+ " 4891 | \n",
+ " 0 | \n",
+ " 4891 | \n",
+ " 0 | \n",
+ " c.4891C>T | \n",
+ " r.(?) | \n",
+ " p.(Pro1631Ser) | \n",
+ " 26 | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " 59885 | \n",
+ " 7329 | \n",
+ " 11 | \n",
+ " 6079 | \n",
+ " -4 | \n",
+ " 6079 | \n",
+ " -3 | \n",
+ " c.6079-4_6079-3del | \n",
+ " r.(?) | \n",
+ " p.(=) | \n",
+ " 29i | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 2536 | \n",
+ " 964211 | \n",
+ " 7329 | \n",
+ " 30 | \n",
+ " 2024 | \n",
+ " -14 | \n",
+ " 2024 | \n",
+ " -14 | \n",
+ " c.2024-14C>T | \n",
+ " r.(=) | \n",
+ " p.(=) | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 2537 | \n",
+ " 964212 | \n",
+ " 7329 | \n",
+ " 30 | \n",
+ " 2024 | \n",
+ " -15 | \n",
+ " 2024 | \n",
+ " -15 | \n",
+ " c.2024-15del | \n",
+ " r.(=) | \n",
+ " p.(=) | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 2538 | \n",
+ " 964215 | \n",
+ " 7329 | \n",
+ " 50 | \n",
+ " 1852 | \n",
+ " 0 | \n",
+ " 1852 | \n",
+ " 0 | \n",
+ " c.1852G>A | \n",
+ " r.(?) | \n",
+ " p.(Gly618Ser) | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 2539 | \n",
+ " 964216 | \n",
+ " 7329 | \n",
+ " 50 | \n",
+ " 1765 | \n",
+ " 0 | \n",
+ " 1765 | \n",
+ " 0 | \n",
+ " c.1765A>G | \n",
+ " r.(?) | \n",
+ " p.(Arg589Gly) | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ " 2540 | \n",
+ " 977314 | \n",
+ " 7329 | \n",
+ " 90 | \n",
+ " 8984 | \n",
+ " 0 | \n",
+ " 8984 | \n",
+ " 0 | \n",
+ " c.8984T>A | \n",
+ " r.(?) | \n",
+ " p.(Ile2995Asn) | \n",
+ " | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
2541 rows × 11 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " id transcriptid ... VariantOnTranscript/Protein VariantOnTranscript/Exon\n",
+ "0 36426 7329 ... p.(Phe2520Leu) 38\n",
+ "1 59881 7329 ... p.(Gln770Pro) 15\n",
+ "2 59883 7329 ... p.(=) 22i\n",
+ "3 59884 7329 ... p.(Pro1631Ser) 26\n",
+ "4 59885 7329 ... p.(=) 29i\n",
+ "... ... ... ... ... ...\n",
+ "2536 964211 7329 ... p.(=) \n",
+ "2537 964212 7329 ... p.(=) \n",
+ "2538 964215 7329 ... p.(Gly618Ser) \n",
+ "2539 964216 7329 ... p.(Arg589Gly) \n",
+ "2540 977314 7329 ... p.(Ile2995Asn) \n",
+ "\n",
+ "[2541 rows x 11 columns]"
+ ]
+ },
+ "metadata": {},
+ "output_type": "display_data"
+ },
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Screenings_To_Variants\n"
+ ]
+ },
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " screeningid | \n",
+ " variantid | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " 126 | \n",
+ " 783293 | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " 211 | \n",
+ " 790459 | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " 1640 | \n",
+ " 235838 | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " 16557 | \n",
+ " 36426 | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " 33164 | \n",
+ " 59884 | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 2144 | \n",
+ " 449279 | \n",
+ " 959046 | \n",
+ "
\n",
+ " \n",
+ " 2145 | \n",
+ " 449284 | \n",
+ " 959051 | \n",
+ "
\n",
+ " \n",
+ " 2146 | \n",
+ " 449293 | \n",
+ " 959060 | \n",
+ "
\n",
+ " \n",
+ " 2147 | \n",
+ " 449295 | \n",
+ " 959474 | \n",
+ "
\n",
+ " \n",
+ " 2148 | \n",
+ " 449297 | \n",
+ " 959064 | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
2149 rows × 2 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " screeningid variantid\n",
+ "0 126 783293\n",
+ "1 211 790459\n",
+ "2 1640 235838\n",
+ "3 16557 36426\n",
+ "4 33164 59884\n",
+ "... ... ...\n",
+ "2144 449279 959046\n",
+ "2145 449284 959051\n",
+ "2146 449293 959060\n",
+ "2147 449295 959474\n",
+ "2148 449297 959064\n",
+ "\n",
+ "[2149 rows x 2 columns]"
+ ]
+ },
+ "metadata": {},
+ "output_type": "display_data"
+ }
+ ],
+ "source": [
+ "for i in data:\n",
+ " print(i)\n",
+ " display(data[i])"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "id": "ef07740b2fa63e42",
+ "metadata": {
+ "collapsed": false
+ },
+ "outputs": [],
+ "source": [
+ "set_lovd_dtypes(data)\n",
+ "for i in data:\n",
+ " print(i)\n",
+ " display(data[i].info())"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 3,
+ "id": "c968af1617be40db",
+ "metadata": {
+ "ExecuteTime": {
+ "end_time": "2024-05-13T15:38:25.149624Z",
+ "start_time": "2024-05-13T15:38:24.807199Z"
+ }
+ },
+ "outputs": [
+ {
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "WARNING:root:Skipping variant g.64307105_64307106del\n",
+ "WARNING:root:Skipping variant g.65495379dup\n",
+ "WARNING:root:Skipping variant g.65495379dup\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64902422_64902438del\n",
+ "WARNING:root:Skipping variant g.64902422_64902438del\n",
+ "WARNING:root:Skipping variant g.64840707_64997105del\n",
+ "WARNING:root:Skipping variant g.64840707_64997105del\n",
+ "WARNING:root:Skipping variant g.64840707_64997105del\n",
+ "WARNING:root:Skipping variant g.65295915del\n",
+ "WARNING:root:Skipping variant g.65295915del\n",
+ "WARNING:root:Skipping variant g.65295915del\n",
+ "WARNING:root:Skipping variant g.65057728_65320715del\n",
+ "WARNING:root:Skipping variant g.65057728_65320715del\n",
+ "WARNING:root:Skipping variant g.65057728_65320715del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.65384425del\n",
+ "WARNING:root:Skipping variant g.63720737_63720746del\n",
+ "WARNING:root:Skipping variant g.63720737_63720746del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64439165del\n",
+ "WARNING:root:Skipping variant g.64439165del\n",
+ "WARNING:root:Skipping variant g.64626122del\n",
+ "WARNING:root:Skipping variant g.65494867del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.65494867del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.65494988_65495003del\n",
+ "WARNING:root:Skipping variant g.63720919_63720920del\n",
+ "WARNING:root:Skipping variant g.63720668dup\n",
+ "WARNING:root:Skipping variant g.63720919_63720920del\n",
+ "WARNING:root:Skipping variant g.63720668dup\n",
+ "WARNING:root:Skipping variant g.63999116del\n",
+ "WARNING:root:Skipping variant g.64591039_64591042del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64822643dup\n",
+ "WARNING:root:Skipping variant g.65495005_65495008delinsAAG\n",
+ "WARNING:root:Skipping variant g.65495005_65495008delinsAAG\n",
+ "WARNING:root:Skipping variant g.65495005_65495008delinsAAG\n",
+ "WARNING:root:Skipping variant g.65495005_65495008delinsAAG\n",
+ "WARNING:root:Skipping variant g.64591505_64591506delinsCT\n",
+ "WARNING:root:Skipping variant g.65495005_65495008delinsAAG\n",
+ "WARNING:root:Skipping variant g.65495005_65495008delinsAAG\n",
+ "WARNING:root:Skipping variant g.65384480dup\n",
+ "WARNING:root:Skipping variant g.63726599_63726600del\n",
+ "WARNING:root:Skipping variant g.65495005_65495008delinsAAG\n",
+ "WARNING:root:Skipping variant g.65495005_65495008delinsAAG\n",
+ "WARNING:root:Skipping variant g.65495005_65495008delinsAAG\n",
+ "WARNING:root:Skipping variant g.63726599_63726600del\n",
+ "WARNING:root:Skipping variant g.65495005_65495008delinsAAG\n",
+ "WARNING:root:Skipping variant g.63726599_63726600del\n",
+ "WARNING:root:Skipping variant g.65335102del\n",
+ "WARNING:root:Skipping variant g.65335102del\n",
+ "WARNING:root:Skipping variant g.65335102del\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.63721377_63721384del\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.63721377_63721384del\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.63999116del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.63999110_63999111del\n",
+ "WARNING:root:Skipping variant g.63999110_63999111del\n",
+ "WARNING:root:Skipping variant g.65321830_65370656del\n",
+ "WARNING:root:Skipping variant g.63720850_63720853del\n",
+ "WARNING:root:Skipping variant g.65321830_65370656del\n",
+ "WARNING:root:Skipping variant g.63720850_63720853del\n",
+ "WARNING:root:Skipping variant g.65321830_65370656del\n",
+ "WARNING:root:Skipping variant g.63720850_63720853del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.63806240del\n",
+ "WARNING:root:Skipping variant g.63806240del\n",
+ "WARNING:root:Skipping variant g.65495332_65495333dup\n",
+ "WARNING:root:Skipping variant g.65324960_65416038del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.65295915del\n",
+ "WARNING:root:Skipping variant g.65494988_65495003del\n",
+ "WARNING:root:Skipping variant g.65494988_65495003del\n",
+ "WARNING:root:Skipping variant g.65494988_65495003del\n",
+ "WARNING:root:Skipping variant g.65494988_65495003del\n",
+ "WARNING:root:Skipping variant g.65494988_65495003del\n",
+ "WARNING:root:Skipping variant g.65494988_65495003del\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.65384480dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.65344144_65344152delinsCTTTTCG\n",
+ "WARNING:root:Skipping variant g.63984409_63984410delinsACGAT\n",
+ "WARNING:root:Skipping variant g.63788163_63788164del\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64912603dup\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590700dup\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64590700dup\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64591845del\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.63984390del\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.63721651_63721652insCA\n",
+ "WARNING:root:Skipping variant g.64590665_64590666del\n",
+ "WARNING:root:Skipping variant g.63721651_63721652insCA\n",
+ "WARNING:root:Skipping variant g.64590665_64590666del\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64591466dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64591480del\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.63788136del\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.63720730_63720733del\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64912603dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590665_64590666del\n",
+ "WARNING:root:Skipping variant g.63721652_63721655dup\n",
+ "WARNING:root:Skipping variant g.64590665_64590666del\n",
+ "WARNING:root:Skipping variant g.63721652_63721655dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64912603dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64591313del\n",
+ "WARNING:root:Skipping variant g.64439355_64439356insA\n",
+ "WARNING:root:Skipping variant g.63984543_63984570del\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.63984537_63984542dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64614795_64939832del\n",
+ "WARNING:root:Skipping variant g.64614795_64939832del\n",
+ "WARNING:root:Skipping variant g.64614795_64939832del\n",
+ "WARNING:root:Skipping variant g.63721576del\n",
+ "WARNING:root:Skipping variant g.64902132_64902133del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.63720889dup\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.65495379dup\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.65495379dup\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.63721625dup\n",
+ "WARNING:root:Skipping variant g.65405300dup\n",
+ "WARNING:root:Skipping variant g.64813506del\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.63720753_63720754dup\n",
+ "WARNING:root:Skipping variant g.65405325dup\n",
+ "WARNING:root:Skipping variant g.65405325dup\n",
+ "WARNING:root:Skipping variant g.65405325dup\n",
+ "WARNING:root:Skipping variant g.65405325dup\n",
+ "WARNING:root:Skipping variant g.65405325dup\n",
+ "WARNING:root:Skipping variant g.65405325dup\n",
+ "WARNING:root:Skipping variant g.65405325dup\n",
+ "WARNING:root:Skipping variant g.65405325dup\n",
+ "WARNING:root:Skipping variant g.65405325dup\n",
+ "WARNING:root:Skipping variant g.65405325dup\n",
+ "WARNING:root:Skipping variant g.65405325dup\n",
+ "WARNING:root:Skipping variant g.65405325dup\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.65707136_65707226del\n",
+ "WARNING:root:Skipping variant g.65495348del\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.63720845_63720846del\n",
+ "WARNING:root:Skipping variant g.63726607del\n",
+ "WARNING:root:Skipping variant g.63721786dup\n",
+ "WARNING:root:Skipping variant g.63721640del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.65344138dup\n",
+ "WARNING:root:Skipping variant g.65402503del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64590699_64590700del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64590699_64590700del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.65384384_65384387del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.65384480dup\n",
+ "WARNING:root:Skipping variant g.63806228dup\n",
+ "WARNING:root:Skipping variant g.63999116del\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.65384384_65384387del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.63721377_63721384del\n",
+ "WARNING:root:Skipping variant g.63999110_63999111del\n",
+ "WARNING:root:Skipping variant g.63999110_63999111del\n",
+ "WARNING:root:Skipping variant g.63999110_63999111del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.64439331del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.65494957dup\n",
+ "WARNING:root:Skipping variant g.63720995del\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.63721771_63721776del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.65494957dup\n",
+ "WARNING:root:Skipping variant g.64591977del\n",
+ "WARNING:root:Skipping variant g.64886728_64886736del\n",
+ "WARNING:root:Skipping variant g.65495379dup\n",
+ "WARNING:root:Skipping variant g.63721138del\n",
+ "WARNING:root:Skipping variant g.65353541del\n",
+ "WARNING:root:Skipping variant g.65353541del\n",
+ "WARNING:root:Skipping variant g.65494988_65495002del\n",
+ "WARNING:root:Skipping variant g.65494988_65495002del\n",
+ "WARNING:root:Skipping variant g.65494988_65495002del\n",
+ "WARNING:root:Skipping variant g.65494988_65495002del\n",
+ "WARNING:root:Skipping variant g.65494988_65495002del\n",
+ "WARNING:root:Skipping variant g.65494988_65495002del\n",
+ "WARNING:root:Skipping variant g.65494988_65495002del\n",
+ "WARNING:root:Skipping variant g.65494988_65495002del\n",
+ "WARNING:root:Skipping variant g.65494988_65495002del\n",
+ "WARNING:root:Skipping variant g.65494988_65495002del\n",
+ "WARNING:root:Skipping variant g.65295857dup\n",
+ "WARNING:root:Skipping variant g.65295856_65295857dup\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.64307105_64307106del\n",
+ "WARNING:root:Skipping variant g.64307103_64307106del\n",
+ "WARNING:root:Skipping variant g.63726618_63726622del\n",
+ "WARNING:root:Skipping variant g.63720642_63720644del\n",
+ "WARNING:root:Skipping variant g.65295857dup\n",
+ "WARNING:root:Skipping variant g.64307105_64307106del\n",
+ "WARNING:root:Skipping variant g.65353541del\n",
+ "WARNING:root:Skipping variant g.64591918_64591919del\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.64590525_64590548del\n",
+ "WARNING:root:Skipping variant g.64388841_64388843del\n",
+ "WARNING:root:Skipping variant g.64307084_64307085del\n",
+ "WARNING:root:Skipping variant g.64307105_64307106del\n",
+ "WARNING:root:Skipping variant g.64307103_64307106del\n",
+ "WARNING:root:Skipping variant g.64307105_64307106del\n",
+ "WARNING:root:Skipping variant g.64593097_64593101del\n",
+ "WARNING:root:Skipping variant g.65384384_65384387del\n",
+ "WARNING:root:Skipping variant g.63999110_63999111del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.64439213del\n",
+ "WARNING:root:Skipping variant g.63721771_63721776del\n",
+ "WARNING:root:Skipping variant g.65494957dup\n",
+ "WARNING:root:Skipping variant g.65494988_65495008delinsAAAAG\n",
+ "WARNING:root:Skipping variant g.63720799_63720808del\n",
+ "WARNING:root:Skipping variant g.63726584del\n",
+ "WARNING:root:Skipping variant g.63726599_63726600del\n",
+ "WARNING:root:Skipping variant g.63726648del\n",
+ "WARNING:root:Skipping variant g.64349976_64426764del\n",
+ "WARNING:root:Skipping variant g.64591505_64591506delinsCT\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.63720728_63720729del\n",
+ "WARNING:root:Skipping variant g.63720845_63720846del\n",
+ "WARNING:root:Skipping variant g.63721162del\n",
+ "WARNING:root:Skipping variant g.63721237_63721240del\n",
+ "WARNING:root:Skipping variant g.63721343del\n",
+ "WARNING:root:Skipping variant g.63721730_63721733del\n",
+ "WARNING:root:Skipping variant g.63721763_63721767del\n",
+ "WARNING:root:Skipping variant g.63721787dup\n",
+ "WARNING:root:Skipping variant g.63726618_63726622del\n",
+ "WARNING:root:Skipping variant g.63788163_63788164del\n",
+ "WARNING:root:Skipping variant g.63984389del\n",
+ "WARNING:root:Skipping variant g.64066348del\n",
+ "WARNING:root:Skipping variant g.64590909dup\n",
+ "WARNING:root:Skipping variant g.64591309del\n",
+ "WARNING:root:Skipping variant g.64591858_64591859del\n",
+ "WARNING:root:Skipping variant g.64886728_64886736del\n",
+ "WARNING:root:Skipping variant g.64945814del\n",
+ "WARNING:root:Skipping variant g.65344143_65344144insCTTT\n",
+ "WARNING:root:Skipping variant g.65344146_65344151del\n",
+ "WARNING:root:Skipping variant g.65344181dup\n",
+ "WARNING:root:Skipping variant g.65384473dup\n",
+ "WARNING:root:Skipping variant g.65405287del\n",
+ "WARNING:root:Skipping variant g.65494885_65494887del\n",
+ "WARNING:root:Skipping variant g.65494961del\n",
+ "WARNING:root:Skipping variant g.65495205del\n",
+ "WARNING:root:Skipping variant g.65495296_65495297del\n",
+ "WARNING:root:Skipping variant g.64590909dup\n",
+ "WARNING:root:Skipping variant g.65384473dup\n",
+ "WARNING:root:Skipping variant g.65405287del\n",
+ "WARNING:root:Skipping variant g.65494885_65494887del\n",
+ "WARNING:root:Skipping variant g.63762589del\n",
+ "WARNING:root:Skipping variant g.63720874del\n",
+ "WARNING:root:Skipping variant g.63721619_63721620insGT\n",
+ "WARNING:root:Skipping variant g.63788268dup\n",
+ "WARNING:root:Skipping variant g.63984369_63984392del\n",
+ "WARNING:root:Skipping variant g.65057740_65057741insA\n",
+ "WARNING:root:Skipping variant g.65057740_65057741insAA\n",
+ "WARNING:root:Skipping variant g.65057750dup\n",
+ "WARNING:root:Skipping variant g.65384384_65384387del\n",
+ "WARNING:root:Skipping variant g.65402624dup\n",
+ "WARNING:root:Skipping variant g.65405377dup\n",
+ "WARNING:root:Skipping variant g.65494957dup\n",
+ "WARNING:root:Skipping variant g.65494957dup\n",
+ "WARNING:root:Skipping variant g.65495379dup\n",
+ "WARNING:root:Skipping variant g.63721625dup\n",
+ "WARNING:root:Skipping variant g.63721704dup\n",
+ "WARNING:root:Skipping variant g.65353537dup\n",
+ "WARNING:root:Skipping variant g.65335105_65335108del\n",
+ "WARNING:root:Skipping variant g.63721385_63721386del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64439195del\n",
+ "WARNING:root:Skipping variant g.63721377_63721384del\n",
+ "WARNING:root:Skipping variant g.63720867_63720868del\n",
+ "WARNING:root:Skipping variant g.63721314_63721321del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.63720737_63720746del\n",
+ "WARNING:root:Skipping variant g.63720737_63720746del\n",
+ "WARNING:root:Skipping variant g.63720737_63720746del\n",
+ "WARNING:root:Skipping variant g.63720737_63720746del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.63765706_63791377del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.63781919_63803805del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64892926_64948294del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64591845del\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64945857dup\n",
+ "WARNING:root:Skipping variant g.63721377_63721384del\n",
+ "WARNING:root:Skipping variant g.63721377_63721384del\n",
+ "WARNING:root:Skipping variant g.63721377_63721384del\n",
+ "WARNING:root:Skipping variant g.63721377_63721384del\n",
+ "WARNING:root:Skipping variant g.63721557_63721558insA\n",
+ "WARNING:root:Skipping variant g.64439319_64439323del\n",
+ "WARNING:root:Skipping variant g.65296021del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.65495181del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.65384425del\n",
+ "WARNING:root:Skipping variant g.64591039_64591042del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.63721599_63721604del\n",
+ "WARNING:root:Skipping variant g.64902132_64902133del\n",
+ "WARNING:root:Skipping variant g.65494988_65495008delinsAAAAG\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.65495236del\n",
+ "WARNING:root:Skipping variant g.64590908_64590909insT\n",
+ "WARNING:root:Skipping variant g.64617409_64617411dup\n",
+ "WARNING:root:Skipping variant g.65295857dup\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.63720845_63720846del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.63720668dup\n",
+ "WARNING:root:Skipping variant g.(63741975_63762461)_(63778180_63788105)dup\n",
+ "WARNING:root:Skipping variant g.65296051_65296052del\n",
+ "WARNING:root:Skipping variant g.65296051_65296052del\n",
+ "WARNING:root:Skipping variant g.64439200dup\n",
+ "WARNING:root:Skipping variant g.63720737_63720746del\n",
+ "WARNING:root:Skipping variant g.63720737_63720746del\n",
+ "WARNING:root:Skipping variant g.65494885_65494887del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.63984390del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.65295897del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.65494885_65494887del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590615dup\n",
+ "WARNING:root:Skipping variant g.63721705del\n",
+ "WARNING:root:Skipping variant g.64081884del\n",
+ "WARNING:root:Skipping variant g.65405342_65405355delinsAAA\n",
+ "WARNING:root:Skipping variant g.65490640_65490643dup\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.65296058del\n",
+ "WARNING:root:Skipping variant g.65405345del\n",
+ "WARNING:root:Skipping variant g.(65405368_65490593)_(65495411_?)del\n",
+ "WARNING:root:Skipping variant g.(65353618_65384385)_(65405368_65490593)del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64081885_64081888del\n",
+ "WARNING:root:Skipping variant g.64591401_64591408dup\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.63721377_63721384del\n",
+ "WARNING:root:Skipping variant g.63721237_63721240del\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.64591256_64591272del\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.63721436del\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.64591039_64591042del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.65495181del\n",
+ "WARNING:root:Skipping variant g.65495181del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.65495181del\n",
+ "WARNING:root:Skipping variant g.65495181del\n",
+ "WARNING:root:Skipping variant g.63720695_63720714del\n",
+ "WARNING:root:Skipping variant g.65384480dup\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.63721377_63721384del\n",
+ "WARNING:root:Skipping variant g.65495181del\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.65495181del\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.65495064del\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.63721377_63721384del\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.65495181del\n",
+ "WARNING:root:Skipping variant g.64066470_64066473del\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.65495181del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.65495181del\n",
+ "WARNING:root:Skipping variant g.64066470_64066473del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.63721377_63721384del\n",
+ "WARNING:root:Skipping variant g.65495181del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.63721377_63721384del\n",
+ "WARNING:root:Skipping variant g.65495181del\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.63720695_63720714del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.63720668del\n",
+ "WARNING:root:Skipping variant g.64912603dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.63720730_63720733del\n",
+ "WARNING:root:Skipping variant g.64902132_64902133del\n",
+ "WARNING:root:Skipping variant g.63720954dup\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.64066335del\n",
+ "WARNING:root:Skipping variant g.64886711del\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.63778166_63778172del\n",
+ "WARNING:root:Skipping variant g.64590914dup\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.63726618_63726622del\n",
+ "WARNING:root:Skipping variant g.64886728_64886736del\n",
+ "WARNING:root:Skipping variant g.64893157_64947352del\n",
+ "WARNING:root:Skipping variant g.64797009_64846087del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.63726519del\n",
+ "WARNING:root:Skipping variant g.64997275_64998015del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.64081605_64082252del\n",
+ "WARNING:root:Skipping variant g.63777755_63789474dup\n",
+ "WARNING:root:Skipping variant g.63720737_63720746del\n",
+ "WARNING:root:Skipping variant g.64081605_64082252del\n",
+ "WARNING:root:Skipping variant g.65353208_65353867del\n",
+ "WARNING:root:Skipping variant g.63984134_63984854del\n",
+ "WARNING:root:Skipping variant g.63743557_63907234del\n",
+ "WARNING:root:Skipping variant g.63720737_63720746del\n",
+ "WARNING:root:Skipping variant g.64662532_64979780del\n",
+ "WARNING:root:Skipping variant g.64839119_64970113del\n",
+ "WARNING:root:Skipping variant g.63720872_63720873del\n",
+ "WARNING:root:Skipping variant g.63721377_63721384del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.64081885_64081888del\n",
+ "WARNING:root:Skipping variant g.63720737_63720746del\n",
+ "WARNING:root:Skipping variant g.63720737_63720746del\n",
+ "WARNING:root:Skipping variant g.63720682dup\n",
+ "WARNING:root:Skipping variant g.63721619dup\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.64388841del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.63720649_63720653del\n",
+ "WARNING:root:Skipping variant g.63721377_63721384del\n",
+ "WARNING:root:Skipping variant g.63720695_63720714del\n",
+ "WARNING:root:Skipping variant g.65384384_65384387del\n",
+ "WARNING:root:Skipping variant g.63720730_63720733del\n",
+ "WARNING:root:Skipping variant g.65335105_65335108del\n",
+ "WARNING:root:Skipping variant g.64439165del\n",
+ "WARNING:root:Skipping variant g.63999116del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.63998527_64002156del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.63721377_63721384del\n",
+ "WARNING:root:Skipping variant g.65495379dup\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.63720730_63720733del\n",
+ "WARNING:root:Skipping variant g.63720730_63720733del\n",
+ "WARNING:root:Skipping variant g.63721237_63721240del\n",
+ "WARNING:root:Skipping variant g.63721237_63721240del\n",
+ "WARNING:root:Skipping variant g.63721237_63721240del\n",
+ "WARNING:root:Skipping variant g.64081885_64081888del\n",
+ "WARNING:root:Skipping variant g.65495348dup\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.64439331del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.64912705del\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.64439200dup\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.65495181del\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.63721625dup\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.65384480del\n",
+ "WARNING:root:Skipping variant g.64388841_64388843del\n",
+ "WARNING:root:Skipping variant g.63998527_64002156del\n",
+ "WARNING:root:Skipping variant g.64590525_64590550delinsTA\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64081884del\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.216327637C>T\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.215879068C>T\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.215878931del\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.65384480dup\n",
+ "WARNING:root:Skipping variant g.216073265G>A\n",
+ "WARNING:root:Skipping variant g.65495206_65495207insTGCCAGTTTA\n",
+ "WARNING:root:Skipping variant g.63721227dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.63720990_63720991insATAT\n",
+ "WARNING:root:Skipping variant g.63720728_63720729del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.63720947_63720948insT\n",
+ "WARNING:root:Skipping variant g.64590875_64590876insTCTT\n",
+ "WARNING:root:Skipping variant g.63721432del\n",
+ "WARNING:root:Skipping variant g.64591501_64591502insAGAA\n",
+ "WARNING:root:Skipping variant g.64590556_64590566del\n",
+ "WARNING:root:Skipping variant g.63999116del\n",
+ "WARNING:root:Skipping variant g.63720753_63720754dup\n",
+ "WARNING:root:Skipping variant g.(?_64945792)_(64945915_64997581)del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.63720730_63720733del\n",
+ "WARNING:root:Skipping variant g.63721377_63721384del\n",
+ "WARNING:root:Skipping variant g.63726524del\n",
+ "WARNING:root:Skipping variant g.64423168_64798957delinsATGA\n",
+ "WARNING:root:Skipping variant g.63942752_64337822delinsATTATG\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant g.?\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64423168_64798957delinsATGA\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.63942752_64337822delinsATTATG\n",
+ "WARNING:root:Skipping variant g.63957115_63958454del\n",
+ "WARNING:root:Skipping variant g.65001113_65005820del\n",
+ "WARNING:root:Skipping variant g.65550144_65552138del\n",
+ "WARNING:root:Skipping variant g.65689153_65694794del\n",
+ "WARNING:root:Skipping variant g.65454073_65454074insN[305]\n",
+ "WARNING:root:Skipping variant g.64296539_64296632del\n",
+ "WARNING:root:Skipping variant g.65204982_65205044del\n",
+ "WARNING:root:Skipping variant g.65564961_65565284del\n",
+ "WARNING:root:Skipping variant :g.64295412_64295413insN[118]\n",
+ "WARNING:root:Skipping variant g.65278328_65278329insN[59]\n",
+ "WARNING:root:Skipping variant g.64590911dup\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64590875_64590876insTCTT\n",
+ "WARNING:root:Skipping variant g.63720947_63720948insT\n",
+ "WARNING:root:Skipping variant g.64591501_64591502insAGAA\n",
+ "WARNING:root:Skipping variant g.63721432del\n",
+ "WARNING:root:Skipping variant g.64590556_64590566del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.65658176_65718924del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant NM_001142800.2:c.6079-2A>G\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.63999116del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.64986218_65013355del\n",
+ "WARNING:root:Skipping variant g.64388690_64388840del\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant g.(?_63719980)_(63726681_63762460)dup\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.65274506_65316845delinsAGATCA\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.65494100_65508832del\n",
+ "WARNING:root:Skipping variant g.65213025_65296862delinsGTTTTCTTTTTA\n",
+ "WARNING:root:Skipping variant g.64066349del\n",
+ "WARNING:root:Skipping variant g.64602159_64657461dup\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.63762589del\n",
+ "WARNING:root:Skipping variant g.65383303_65441305delinsAACTTTTACT\n",
+ "WARNING:root:Skipping variant g.63720737_63720746del\n",
+ "WARNING:root:Skipping variant g.65284957_66872862delinsT\n",
+ "WARNING:root:Skipping variant g.64122444_64129159delins64204448_64235506inv\n",
+ "WARNING:root:Skipping variant g.64937848_64948401delins[64944099_64944163inv;CAATTTTGTAT]\n",
+ "WARNING:root:Skipping variant g.63721385_63721386del\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.63720654_63720657del\n",
+ "WARNING:root:Skipping variant g.64591069_64591081del\n",
+ "WARNING:root:Skipping variant g.64886841del\n",
+ "WARNING:root:Skipping variant g.64790603_64977512del\n",
+ "WARNING:root:Skipping variant g.63721625dup\n",
+ "WARNING:root:Skipping variant g.64591514_64591520del\n",
+ "WARNING:root:Skipping variant g.63720649_63720653del\n",
+ "WARNING:root:Skipping variant g.65479942_67131267inv\n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n",
+ "WARNING:root:Skipping variant \n"
+ ]
+ }
+ ],
+ "source": [
+ "save_lovd_as_vcf(data[\"Variants_On_Genome\"], \"./lovd.vcf\")"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 4,
+ "id": "c7ff16903e0c52bd",
+ "metadata": {
+ "ExecuteTime": {
+ "end_time": "2024-05-13T15:58:47.868055Z",
+ "start_time": "2024-05-13T15:58:41.380466Z"
+ }
+ },
+ "outputs": [
+ {
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "2024-05-13 18:58:41.794056: I tensorflow/core/util/port.cc:113] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.\n",
+ "2024-05-13 18:58:41.794769: I external/local_tsl/tsl/cuda/cudart_stub.cc:32] Could not find cuda drivers on your machine, GPU will not be used.\n",
+ "2024-05-13 18:58:41.797917: I external/local_tsl/tsl/cuda/cudart_stub.cc:32] Could not find cuda drivers on your machine, GPU will not be used.\n",
+ "2024-05-13 18:58:41.857361: I tensorflow/core/platform/cpu_feature_guard.cc:210] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
+ "To enable the following instructions: AVX2 AVX_VNNI FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
+ "2024-05-13 18:58:42.410244: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
+ "2024-05-13 18:58:42.957291: I external/local_xla/xla/stream_executor/cuda/cuda_executor.cc:998] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero. See more at https://github.com/torvalds/linux/blob/v6.0/Documentation/ABI/testing/sysfs-bus-pci#L344-L355\n",
+ "2024-05-13 18:58:42.957684: W tensorflow/core/common_runtime/gpu/gpu_device.cc:2251] Cannot dlopen some GPU libraries. Please make sure the missing libraries mentioned above are installed properly if you would like to use GPU. Follow the guide at https://www.tensorflow.org/install/gpu for how to download and setup the required libraries for your platform.\n",
+ "Skipping registering GPU devices...\n",
+ "WARNING:absl:No training configuration found in the save file, so the model was *not* compiled. Compile it manually.\n",
+ "WARNING:absl:No training configuration found in the save file, so the model was *not* compiled. Compile it manually.\n",
+ "WARNING:absl:No training configuration found in the save file, so the model was *not* compiled. Compile it manually.\n",
+ "WARNING:absl:No training configuration found in the save file, so the model was *not* compiled. Compile it manually.\n",
+ "WARNING:absl:No training configuration found in the save file, so the model was *not* compiled. Compile it manually.\n"
+ ]
+ },
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "\u001B[1m1/1\u001B[0m \u001B[32m━━━━━━━━━━━━━━━━━━━━\u001B[0m\u001B[37m\u001B[0m \u001B[1m1s\u001B[0m 595ms/step\n",
+ "\u001B[1m1/1\u001B[0m \u001B[32m━━━━━━━━━━━━━━━━━━━━\u001B[0m\u001B[37m\u001B[0m \u001B[1m1s\u001B[0m 554ms/step\n",
+ "\u001B[1m1/1\u001B[0m \u001B[32m━━━━━━━━━━━━━━━━━━━━\u001B[0m\u001B[37m\u001B[0m \u001B[1m1s\u001B[0m 553ms/step\n",
+ "\u001B[1m1/1\u001B[0m \u001B[32m━━━━━━━━━━━━━━━━━━━━\u001B[0m\u001B[37m\u001B[0m \u001B[1m1s\u001B[0m 548ms/step\n"
+ ]
+ },
+ {
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "WARNING:tensorflow:5 out of the last 5 calls to .one_step_on_data_distributed at 0x7dee981abf40> triggered tf.function retracing. Tracing is expensive and the excessive number of tracings could be due to (1) creating @tf.function repeatedly in a loop, (2) passing tensors with different shapes, (3) passing Python objects instead of tensors. For (1), please define your @tf.function outside of the loop. For (2), @tf.function has reduce_retracing=True option that can avoid unnecessary retracing. For (3), please refer to https://www.tensorflow.org/guide/function#controlling_retracing and https://www.tensorflow.org/api_docs/python/tf/function for more details.\n",
+ "WARNING:tensorflow:5 out of the last 5 calls to .one_step_on_data_distributed at 0x7dee981abf40> triggered tf.function retracing. Tracing is expensive and the excessive number of tracings could be due to (1) creating @tf.function repeatedly in a loop, (2) passing tensors with different shapes, (3) passing Python objects instead of tensors. For (1), please define your @tf.function outside of the loop. For (2), @tf.function has reduce_retracing=True option that can avoid unnecessary retracing. For (3), please refer to https://www.tensorflow.org/guide/function#controlling_retracing and https://www.tensorflow.org/api_docs/python/tf/function for more details.\n"
+ ]
+ },
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "\u001B[1m1/1\u001B[0m \u001B[32m━━━━━━━━━━━━━━━━━━━━\u001B[0m\u001B[37m\u001B[0m \u001B[1m1s\u001B[0m 548ms/step\n",
+ "\u001B[1m1/1\u001B[0m \u001B[32m━━━━━━━━━━━━━━━━━━━━\u001B[0m\u001B[37m\u001B[0m \u001B[1m0s\u001B[0m 49ms/step\n",
+ "\u001B[1m1/1\u001B[0m \u001B[32m━━━━━━━━━━━━━━━━━━━━\u001B[0m\u001B[37m\u001B[0m \u001B[1m0s\u001B[0m 51ms/step\n",
+ "\u001B[1m1/1\u001B[0m \u001B[32m━━━━━━━━━━━━━━━━━━━━\u001B[0m\u001B[37m\u001B[0m \u001B[1m0s\u001B[0m 51ms/step\n",
+ "\u001B[1m1/1\u001B[0m \u001B[32m━━━━━━━━━━━━━━━━━━━━\u001B[0m\u001B[37m\u001B[0m \u001B[1m0s\u001B[0m 59ms/step\n",
+ "\u001B[1m1/1\u001B[0m \u001B[32m━━━━━━━━━━━━━━━━━━━━\u001B[0m\u001B[37m\u001B[0m \u001B[1m0s\u001B[0m 53ms/step\n"
+ ]
+ },
+ {
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "WARNING:root:dede['G|EYS|0.00|0.00|0.00|0.00|3|9|-20|9']\n"
+ ]
+ },
+ {
+ "data": {
+ "text/plain": [
+ "0"
+ ]
+ },
+ "execution_count": 4,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "from subprocess import Popen\n",
+ "\n",
+ "\n",
+ "process = Popen(\"spliceai -I ./lovd.vcf -O ./lovd_output.vcf -R ../tools/spliceai/hg38.fa -A grch38\".split())\n",
+ "process.wait()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 1,
+ "id": "0514ccc3-5c91-41ad-ab15-f4158030ea14",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "/home/nojsaj/kath/tools/revel/revel.py:9: DtypeWarning: Columns (0,2) have mixed types. Specify dtype option on import or set low_memory=False.\n",
+ " revel_data = pd.read_csv(revel_file)\n"
+ ]
+ },
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " chr | \n",
+ " hg19_pos | \n",
+ " grch38_pos | \n",
+ " ref | \n",
+ " alt | \n",
+ " aaref | \n",
+ " aaalt | \n",
+ " REVEL | \n",
+ " Ensembl_transcriptid | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 28756127 | \n",
+ " 6 | \n",
+ " 65655758 | \n",
+ " 64945865 | \n",
+ " T | \n",
+ " A | \n",
+ " Q | \n",
+ " L | \n",
+ " 0.188 | \n",
+ " ENST00000503581;ENST00000370621;ENST00000370616 | \n",
+ "
\n",
+ " \n",
+ " 28756128 | \n",
+ " 6 | \n",
+ " 65655758 | \n",
+ " 64945865 | \n",
+ " T | \n",
+ " C | \n",
+ " Q | \n",
+ " R | \n",
+ " 0.111 | \n",
+ " ENST00000503581;ENST00000370621;ENST00000370616 | \n",
+ "
\n",
+ " \n",
+ " 28756129 | \n",
+ " 6 | \n",
+ " 65655758 | \n",
+ " 64945865 | \n",
+ " T | \n",
+ " G | \n",
+ " Q | \n",
+ " P | \n",
+ " 0.344 | \n",
+ " ENST00000503581;ENST00000370621;ENST00000370616 | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ " chr hg19_pos grch38_pos ref alt aaref aaalt REVEL \\\n",
+ "28756127 6 65655758 64945865 T A Q L 0.188 \n",
+ "28756128 6 65655758 64945865 T C Q R 0.111 \n",
+ "28756129 6 65655758 64945865 T G Q P 0.344 \n",
+ "\n",
+ " Ensembl_transcriptid \n",
+ "28756127 ENST00000503581;ENST00000370621;ENST00000370616 \n",
+ "28756128 ENST00000503581;ENST00000370621;ENST00000370616 \n",
+ "28756129 ENST00000503581;ENST00000370621;ENST00000370616 "
+ ]
+ },
+ "metadata": {},
+ "output_type": "display_data"
+ }
+ ],
+ "source": [
+ "from tools import get_revel_scores\n",
+ "\n",
+ "chromosome = 6\n",
+ "position = 65655758\n",
+ "\n",
+ "results = get_revel_scores(chromosome, position)\n",
+ "\n",
+ "display(results)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "outputs": [],
+ "source": [
+ "from api.data.downloading import download_selected_database_for_eys_gene\n",
+ "download_selected_database_for_eys_gene(\"clinvar\", override=False)"
+ ],
+ "metadata": {
+ "collapsed": false,
+ "ExecuteTime": {
+ "end_time": "2024-08-12T16:46:07.973915Z",
+ "start_time": "2024-08-12T16:46:07.970874Z"
+ }
+ },
+ "id": "b80a1049abe7596e",
+ "execution_count": 12
+ },
+ {
+ "cell_type": "code",
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "The file at ../data/lovd/lovd_data.txt already exists.\n"
+ ]
+ }
+ ],
+ "source": [
+ "from api.data.downloading import download_selected_database_for_eys_gene\n",
+ "download_selected_database_for_eys_gene(\"lovd\", override=False)"
+ ],
+ "metadata": {
+ "collapsed": false,
+ "ExecuteTime": {
+ "end_time": "2024-08-12T16:47:56.094297Z",
+ "start_time": "2024-08-12T16:47:56.090300Z"
+ }
+ },
+ "id": "a1e10fc8175753a0",
+ "execution_count": 4
+ },
+ {
+ "cell_type": "code",
+ "outputs": [
+ {
+ "data": {
+ "text/plain": " gnomAD ID Chromosome Position rsIDs Reference \\\n0 6-63720525-A-G 6 63720525 rs1768331164 A \n1 6-63720525-A-T 6 63720525 rs1768331164 A \n2 6-63720526-T-A 6 63720526 T \n3 6-63720531-C-CAA 6 63720531 C \n4 6-63720531-C-G 6 63720531 rs927390284 C \n... ... ... ... ... ... \n11083 6-65495478-G-A 6 65495478 rs530118054 G \n11084 6-65495479-G-A 6 65495479 rs1766225632 G \n11085 6-65495482-A-G 6 65495482 rs1766225707 A \n11086 6-65495484-T-G 6 65495484 rs1766225807 T \n11087 6-65495485-T-C 6 65495485 T \n\n Alternate Source Filters - exomes \\\n0 G gnomAD Exomes,gnomAD Genomes PASS \n1 T gnomAD Genomes \n2 A gnomAD Exomes PASS \n3 CAA gnomAD Exomes PASS \n4 G gnomAD Exomes,gnomAD Genomes PASS \n... ... ... ... \n11083 A gnomAD Exomes,gnomAD Genomes PASS \n11084 A gnomAD Exomes PASS \n11085 G gnomAD Exomes,gnomAD Genomes PASS \n11086 G gnomAD Exomes PASS \n11087 C gnomAD Exomes PASS \n\n Filters - genomes Transcript ... Homozygote Count Amish \\\n0 PASS ENST00000503581.6 ... 0 \n1 PASS ENST00000503581.6 ... 0 \n2 ENST00000503581.6 ... 0 \n3 ENST00000503581.6 ... 0 \n4 PASS ENST00000503581.6 ... 0 \n... ... ... ... ... \n11083 PASS ENST00000503581.6 ... 0 \n11084 ENST00000503581.6 ... 0 \n11085 PASS ENST00000503581.6 ... 0 \n11086 ENST00000503581.6 ... 0 \n11087 ENST00000503581.6 ... 0 \n\n Hemizygote Count Amish Allele Count South Asian \\\n0 0 0 \n1 0 0 \n2 0 1 \n3 0 0 \n4 0 0 \n... ... ... \n11083 0 4 \n11084 0 0 \n11085 0 0 \n11086 0 5 \n11087 0 1 \n\n Allele Number South Asian Homozygote Count South Asian \\\n0 55362 0 \n1 55362 0 \n2 55360 0 \n3 57520 0 \n4 57524 0 \n... ... ... \n11083 88352 0 \n11084 88316 0 \n11085 87828 0 \n11086 87818 0 \n11087 87636 0 \n\n Hemizygote Count South Asian Allele Count Remaining \\\n0 0 0 \n1 0 0 \n2 0 0 \n3 0 1 \n4 0 0 \n... ... ... 
\n11083 0 8 \n11084 0 0 \n11085 0 0 \n11086 0 0 \n11087 0 0 \n\n Allele Number Remaining Homozygote Count Remaining \\\n0 44082 0 \n1 44082 0 \n2 44162 0 \n3 47700 0 \n4 47678 0 \n... ... ... \n11083 60164 0 \n11084 60142 0 \n11085 59586 0 \n11086 59748 0 \n11087 59608 0 \n\n Hemizygote Count Remaining \n0 0 \n1 0 \n2 0 \n3 0 \n4 0 \n... ... \n11083 0 \n11084 0 \n11085 0 \n11086 0 \n11087 0 \n\n[11088 rows x 72 columns]",
+ "text/html": "\n\n
\n \n \n | \n gnomAD ID | \n Chromosome | \n Position | \n rsIDs | \n Reference | \n Alternate | \n Source | \n Filters - exomes | \n Filters - genomes | \n Transcript | \n ... | \n Homozygote Count Amish | \n Hemizygote Count Amish | \n Allele Count South Asian | \n Allele Number South Asian | \n Homozygote Count South Asian | \n Hemizygote Count South Asian | \n Allele Count Remaining | \n Allele Number Remaining | \n Homozygote Count Remaining | \n Hemizygote Count Remaining | \n
\n \n \n \n 0 | \n 6-63720525-A-G | \n 6 | \n 63720525 | \n rs1768331164 | \n A | \n G | \n gnomAD Exomes,gnomAD Genomes | \n PASS | \n PASS | \n ENST00000503581.6 | \n ... | \n 0 | \n 0 | \n 0 | \n 55362 | \n 0 | \n 0 | \n 0 | \n 44082 | \n 0 | \n 0 | \n
\n \n 1 | \n 6-63720525-A-T | \n 6 | \n 63720525 | \n rs1768331164 | \n A | \n T | \n gnomAD Genomes | \n <NA> | \n PASS | \n ENST00000503581.6 | \n ... | \n 0 | \n 0 | \n 0 | \n 55362 | \n 0 | \n 0 | \n 0 | \n 44082 | \n 0 | \n 0 | \n
\n \n 2 | \n 6-63720526-T-A | \n 6 | \n 63720526 | \n <NA> | \n T | \n A | \n gnomAD Exomes | \n PASS | \n <NA> | \n ENST00000503581.6 | \n ... | \n 0 | \n 0 | \n 1 | \n 55360 | \n 0 | \n 0 | \n 0 | \n 44162 | \n 0 | \n 0 | \n
\n \n 3 | \n 6-63720531-C-CAA | \n 6 | \n 63720531 | \n <NA> | \n C | \n CAA | \n gnomAD Exomes | \n PASS | \n <NA> | \n ENST00000503581.6 | \n ... | \n 0 | \n 0 | \n 0 | \n 57520 | \n 0 | \n 0 | \n 1 | \n 47700 | \n 0 | \n 0 | \n
\n \n 4 | \n 6-63720531-C-G | \n 6 | \n 63720531 | \n rs927390284 | \n C | \n G | \n gnomAD Exomes,gnomAD Genomes | \n PASS | \n PASS | \n ENST00000503581.6 | \n ... | \n 0 | \n 0 | \n 0 | \n 57524 | \n 0 | \n 0 | \n 0 | \n 47678 | \n 0 | \n 0 | \n
\n \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n
\n \n 11083 | \n 6-65495478-G-A | \n 6 | \n 65495478 | \n rs530118054 | \n G | \n A | \n gnomAD Exomes,gnomAD Genomes | \n PASS | \n PASS | \n ENST00000503581.6 | \n ... | \n 0 | \n 0 | \n 4 | \n 88352 | \n 0 | \n 0 | \n 8 | \n 60164 | \n 0 | \n 0 | \n
\n \n 11084 | \n 6-65495479-G-A | \n 6 | \n 65495479 | \n rs1766225632 | \n G | \n A | \n gnomAD Exomes | \n PASS | \n <NA> | \n ENST00000503581.6 | \n ... | \n 0 | \n 0 | \n 0 | \n 88316 | \n 0 | \n 0 | \n 0 | \n 60142 | \n 0 | \n 0 | \n
\n \n 11085 | \n 6-65495482-A-G | \n 6 | \n 65495482 | \n rs1766225707 | \n A | \n G | \n gnomAD Exomes,gnomAD Genomes | \n PASS | \n PASS | \n ENST00000503581.6 | \n ... | \n 0 | \n 0 | \n 0 | \n 87828 | \n 0 | \n 0 | \n 0 | \n 59586 | \n 0 | \n 0 | \n
\n \n 11086 | \n 6-65495484-T-G | \n 6 | \n 65495484 | \n rs1766225807 | \n T | \n G | \n gnomAD Exomes | \n PASS | \n <NA> | \n ENST00000503581.6 | \n ... | \n 0 | \n 0 | \n 5 | \n 87818 | \n 0 | \n 0 | \n 0 | \n 59748 | \n 0 | \n 0 | \n
\n \n 11087 | \n 6-65495485-T-C | \n 6 | \n 65495485 | \n <NA> | \n T | \n C | \n gnomAD Exomes | \n PASS | \n <NA> | \n ENST00000503581.6 | \n ... | \n 0 | \n 0 | \n 1 | \n 87636 | \n 0 | \n 0 | \n 0 | \n 59608 | \n 0 | \n 0 | \n
\n \n
\n
11088 rows × 72 columns
\n
"
+ },
+ "execution_count": 1,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "from api.data.refactoring import parse_gnomad, set_gnomad_dtypes\n",
+ "from api import (download_selected_database_for_eys_gene, GNOMAD_PATH)\n",
+ "\n",
+ "download_selected_database_for_eys_gene('gnomad', override=False)\n",
+ "\n",
+ "gnomad_data = parse_gnomad(GNOMAD_PATH+'/gnomad_data.csv')\n",
+ "\n",
+ "set_gnomad_dtypes(gnomad_data)\n",
+ "\n",
+ "gnomad_data"
+ ],
+ "metadata": {
+ "collapsed": false,
+ "ExecuteTime": {
+ "end_time": "2024-08-20T18:43:31.996838Z",
+ "start_time": "2024-08-20T18:43:30.905943Z"
+ }
+ },
+ "id": "4ba7fd02a60f5693",
+ "execution_count": 1
+ },
+ {
+ "cell_type": "code",
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "The file at ../data/lovd/lovd_data.txt already exists.\n"
+ ]
+ },
+ {
+ "data": {
+ "text/plain": " id transcriptid effectid position_c_start \\\n0 170936 7329 90 -538 \n1 235579 7329 99 -332 \n2 235593 7329 99 1300 \n3 235595 7329 99 1300 \n4 235603 7329 99 6572 \n... ... ... ... ... \n13272 822052 7329 70 1767 \n13273 822775 7329 70 0 \n13274 822785 7329 70 0 \n13275 822816 7329 70 0 \n13276 867648 7329 70 0 \n\n position_c_start_intron position_c_end position_c_end_intron \\\n0 0 1599 1 \n1 -1 748 1 \n2 -1 1459 1 \n3 -1 1459 1 \n4 -1 6725 1 \n... ... ... ... \n13272 -1 2023 1 \n13273 0 0 0 \n13274 0 0 0 \n13275 0 0 0 \n13276 0 0 0 \n\n VariantOnTranscript/DNA VariantOnTranscript/RNA \\\n0 c.(?_-538)_(1599+1_1600-1)del r.0? \n1 c.(-333+1_-332-1)_(748+1_749-1)del r.? \n2 c.(1299+1_1300-1)_(1459+1_1460-1)del r.? \n3 c.(1299+1_1300-1)_(1459+1_1460-1)del r.(?) \n4 c.(6571+1_6572-1)_(6725+1_6726-1)del r.? \n... ... ... \n13272 c.(1766+1_1767-1)_(2023+1_2024-1)del r.spl \n13273 c.? r.(?) \n13274 c.? r.(?) \n13275 c.? r.(?) \n13276 c.? r.(?) \n\n VariantOnTranscript/Protein VariantOnTranscript/Exon \\\n0 p.0? _1_10i \n1 p.? 2i_4i \n2 p.? 8i_9i \n3 p.? 8i_9i \n4 p.(Ser2191Thrfs*14) 32i_33i \n... ... ... \n13272 p.(?) \n13273 p.(Tyr2555fs) \n13274 p.(Asp498fs) \n13275 p.(Gln3101fs) \n13276 p.? \n\n VariantOnGenome/DNA/hg38 gnomAD ID_gnomad hg38_gnomad \n0 \n1 \n2 \n3 \n4 \n... ... ... ... \n13272 g.? \n13273 g.? \n13274 g.? \n13275 g.? \n13276 g.? \n\n[13277 rows x 14 columns]",
+ "text/html": "\n\n
\n \n \n | \n id | \n transcriptid | \n effectid | \n position_c_start | \n position_c_start_intron | \n position_c_end | \n position_c_end_intron | \n VariantOnTranscript/DNA | \n VariantOnTranscript/RNA | \n VariantOnTranscript/Protein | \n VariantOnTranscript/Exon | \n VariantOnGenome/DNA/hg38 | \n gnomAD ID_gnomad | \n hg38_gnomad | \n
\n \n \n \n 0 | \n 170936 | \n 7329 | \n 90 | \n -538 | \n 0 | \n 1599 | \n 1 | \n c.(?_-538)_(1599+1_1600-1)del | \n r.0? | \n p.0? | \n _1_10i | \n | \n <NA> | \n <NA> | \n
\n \n 1 | \n 235579 | \n 7329 | \n 99 | \n -332 | \n -1 | \n 748 | \n 1 | \n c.(-333+1_-332-1)_(748+1_749-1)del | \n r.? | \n p.? | \n 2i_4i | \n | \n <NA> | \n <NA> | \n
\n \n 2 | \n 235593 | \n 7329 | \n 99 | \n 1300 | \n -1 | \n 1459 | \n 1 | \n c.(1299+1_1300-1)_(1459+1_1460-1)del | \n r.? | \n p.? | \n 8i_9i | \n | \n <NA> | \n <NA> | \n
\n \n 3 | \n 235595 | \n 7329 | \n 99 | \n 1300 | \n -1 | \n 1459 | \n 1 | \n c.(1299+1_1300-1)_(1459+1_1460-1)del | \n r.(?) | \n p.? | \n 8i_9i | \n | \n <NA> | \n <NA> | \n
\n \n 4 | \n 235603 | \n 7329 | \n 99 | \n 6572 | \n -1 | \n 6725 | \n 1 | \n c.(6571+1_6572-1)_(6725+1_6726-1)del | \n r.? | \n p.(Ser2191Thrfs*14) | \n 32i_33i | \n | \n <NA> | \n <NA> | \n
\n \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n ... | \n
\n \n 13272 | \n 822052 | \n 7329 | \n 70 | \n 1767 | \n -1 | \n 2023 | \n 1 | \n c.(1766+1_1767-1)_(2023+1_2024-1)del | \n r.spl | \n p.(?) | \n | \n g.? | \n <NA> | \n <NA> | \n
\n \n 13273 | \n 822775 | \n 7329 | \n 70 | \n 0 | \n 0 | \n 0 | \n 0 | \n c.? | \n r.(?) | \n p.(Tyr2555fs) | \n | \n g.? | \n <NA> | \n <NA> | \n
\n \n 13274 | \n 822785 | \n 7329 | \n 70 | \n 0 | \n 0 | \n 0 | \n 0 | \n c.? | \n r.(?) | \n p.(Asp498fs) | \n | \n g.? | \n <NA> | \n <NA> | \n
\n \n 13275 | \n 822816 | \n 7329 | \n 70 | \n 0 | \n 0 | \n 0 | \n 0 | \n c.? | \n r.(?) | \n p.(Gln3101fs) | \n | \n g.? | \n <NA> | \n <NA> | \n
\n \n 13276 | \n 867648 | \n 7329 | \n 70 | \n 0 | \n 0 | \n 0 | \n 0 | \n c.? | \n r.(?) | \n p.? | \n | \n g.? | \n <NA> | \n <NA> | \n
\n \n
\n
13277 rows × 14 columns
\n
"
+ },
+ "execution_count": 1,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "from api.data.refactoring import merge_gnomad_lovd, parse_gnomad, set_gnomad_dtypes\n",
+ "import pandas as pd\n",
+ "from api import (download_selected_database_for_eys_gene,\n",
+ " parse_lovd,\n",
+ " set_lovd_dtypes,\n",
+ " LOVD_PATH,\n",
+ " GNOMAD_PATH)\n",
+ "\n",
+ "download_selected_database_for_eys_gene('lovd', override=False)\n",
+ "download_selected_database_for_eys_gene('gnomad', override=False)\n",
+ "\n",
+ "lovd_data = parse_lovd(LOVD_PATH + \"/lovd_data.txt\")\n",
+ "gnomad_data = parse_gnomad(GNOMAD_PATH+'/gnomad_data.csv')\n",
+ "\n",
+ "set_lovd_dtypes(lovd_data)\n",
+ "set_gnomad_dtypes(gnomad_data)\n",
+ "\n",
+ "variants_on_genome = lovd_data[\"Variants_On_Genome\"].copy()\n",
+ "\n",
+ "lovd_data = pd.merge(lovd_data[\"Variants_On_Transcripts\"],\n",
+ " variants_on_genome[['id','VariantOnGenome/DNA/hg38']],\n",
+ " on='id',\n",
+ " how='left')\n",
+ "\n",
+ "gnomad_data = gnomad_data.copy()\n",
+ "final_data = merge_gnomad_lovd(lovd_data, gnomad_data)\n",
+ "final_data"
+ ],
+ "metadata": {
+ "collapsed": false,
+ "ExecuteTime": {
+ "end_time": "2024-08-21T18:35:42.249375Z",
+ "start_time": "2024-08-21T18:35:33.312752Z"
+ }
+ },
+ "id": "dd9b17623f26a07c",
+ "execution_count": 1
+ },
+ {
+ "cell_type": "code",
+ "outputs": [],
+ "source": [],
+ "metadata": {
+ "collapsed": false
+ },
+ "id": "1a3b6e41853817ca",
+ "execution_count": null
+ }
+ ],
+ "metadata": {
+ "kernelspec": {
+ "display_name": "Python 3 (ipykernel)",
+ "language": "python",
+ "name": "python3"
+ },
+ "language_info": {
+ "codemirror_mode": {
+ "name": "ipython",
+ "version": 3
+ },
+ "file_extension": ".py",
+ "mimetype": "text/x-python",
+ "name": "python",
+ "nbconvert_exporter": "python",
+ "pygments_lexer": "ipython3",
+ "version": "3.11.6"
+ }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}