{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "import pandas as pd" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [], "source": [ "import re \n", "\n", "def sorted_nicely( l ): \n", " \"\"\" Sort the given iterable in the way that humans expect.\"\"\" \n", " convert = lambda text: int(text) if text.isdigit() else text \n", " alphanum_key = lambda key: [ convert(c) for c in re.split('([0-9]+)', key) ] \n", " return sorted(l, key = alphanum_key)" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [], "source": [ "import pandas as pd\n", "import h5py\n", "import logging\n", "import numpy as np\n", "\n", "import pandas as pd\n", "from scipy import stats, sparse\n", "import bottleneck\n", "#%matplotlib notebook\n", "%matplotlib inline\n", "#import matplotlib\n", "#matplotlib.use('Agg')\n", "import matplotlib.pyplot as plt\n", "import matplotlib.ticker as plticker\n", "\n", "from scipy.sparse import csr_matrix\n", "\n", "from scipy import sparse\n", "#import pickle\n", "import numpy as np\n", "import pandas as pd\n", "from scipy import sparse\n", "from scipy.sparse import csr_matrix" ] }, { "cell_type": "code", "execution_count": 32, "metadata": {}, "outputs": [], "source": [ "def run_egad(go, nw, **kwargs):\n", " \"\"\"EGAD running function\n", " \n", " Wrapper to lower level functions for EGAD\n", "\n", " EGAD measures modularity of gene lists in co-expression networks. \n", "\n", " This was translated from the MATLAB version, which does tiled Cross Validation\n", " \n", " The useful kwargs are:\n", " int - nFold : Number of CV folds to do, default is 3, \n", " int - {min,max}_count : limits for number of terms in each gene list, these are exclusive values\n", "\n", "\n", " Arguments:\n", " go {pd.DataFrame} -- dataframe of genes x terms of values [0,1], where 1 is included in gene lists\n", " nw {pd.DataFrame} -- dataframe of co-expression network, genes x genes\n", " **kwargs \n", " \n", " Returns:\n", " pd.DataFrame -- dataframe of terms x metrics where the metrics are \n", " ['AUC', 'AVG_NODE_DEGREE', 'DEGREE_NULL_AUC', 'P_Value']\n", " \"\"\"\n", " assert nw.shape[0] == nw.shape[1] , 'Network is not square'\n", " #print(nw.index)\n", " #nw.columns = nw.columns.astype(int)\n", " #print(nw.columns.astype(int))\n", " assert np.all(nw.index == nw.columns) , 'Network index and columns are not in the same order'\n", "\n", " #nw_mask = nw.isna().sum(axis=1) != nw.shape[1]\n", " #nw = nw.loc[nw_mask, nw_mask].astype('float')\n", " #np.fill_diagonal(nw.values, 1)\n", " return _runNV(go, nw, **kwargs)\n", "\n", "def _runNV(go, nw, nFold=3, min_count=1, max_count=1807):\n", "\n", " #Make sure genes are same in go and nw\n", " #go.index = go.index.map(str) \n", " #nw.index = nw.index.map(str)\n", " #nw.index = nw.index.str.replace('_', '')\n", " #go.index = go.index.str.replace('_', '')\n", " print (nw)\n", " genes_intersect = go.index.intersection(nw.index)\n", "\n", "\n", " print (genes_intersect)\n", " go = go.loc[genes_intersect, :]\n", " nw = nw.loc[genes_intersect, genes_intersect]\n", " print (go)\n", " print (nw.shape)\n", " print (go.shape)\n", " sparsity = 1.0 - np.count_nonzero(go) / go.size\n", " print (sparsity)\n", " sparsity = 1.0 - np.count_nonzero(nw) / nw.size\n", " print (sparsity)\n", " #print(nw\n", " #print(go\n", " nw_mask = nw.isna().sum(axis=1) != nw.shape[1]\n", " nw = nw.loc[nw_mask, nw_mask].astype('float')\n", " np.fill_diagonal(nw.values, 1)\n", " #Make sure there aren't duplicates\n", " duplicates = nw.index.duplicated(keep='first')\n", " nw = nw.loc[~duplicates, ~duplicates]\n", "\n", " go = go.loc[:, (go.sum(axis=0) > min_count) & (go.sum(axis=0) < max_count)]\n", " go = go.loc[~go.index.duplicated(keep='first'), :]\n", " print(go.sum(axis=0))\n", "\n", " roc = _new_egad(go.values, nw.values, nFold)\n", "\n", " col_names = ['AUC', 'AVG_NODE_DEGREE', 'DEGREE_NULL_AUC', 'P_Value']\n", " #Put output in dataframe\n", " return pd.DataFrame(dict(zip(col_names, roc)), index=go.columns)\n", "\n", "def _new_egad(go, nw, nFold):\n", "\n", " #Build Cross validated Positive\n", " x, y = np.where(go)\n", " #print(x, y)\n", " cvgo = {}\n", " for i in np.arange(nFold):\n", " a = x[i::nFold]\n", " #print(a)\n", " b = y[i::nFold]\n", " dat = np.ones_like(a)\n", " mask = sparse.coo_matrix((dat, (a, b)), shape=go.shape)\n", " cvgo[i] = go - mask.toarray()\n", "\n", " CVgo = np.concatenate(list(cvgo.values()), axis=1)\n", " #print(CVgo)\n", "\n", " sumin = np.matmul(nw.T, CVgo)\n", "\n", " degree = np.sum(nw, axis=0)\n", " #print(degree)\n", " #print(degree[:, None])\n", "\n", " predicts = sumin / degree[:, None]\n", " #print(predicts)\n", "\n", " np.place(predicts, CVgo > 0, np.nan)\n", "\n", " #print(predicts)\n", "\n", " #Calculate ranks of positives\n", " rank_abs = lambda x: stats.rankdata(np.abs(x))\n", " predicts2 = np.apply_along_axis(rank_abs, 0, predicts)\n", " #print(predicts2)\n", "\n", " #Masking Nans that were ranked (how tiedrank works in matlab)\n", " predicts2[np.isnan(predicts)] = np.nan\n", " #print(predicts2)\n", "\n", " filtering = np.tile(go, nFold)\n", " #print(filtering)\n", "\n", " #negatives :filtering == 0\n", " #Sets Ranks of negatives to 0\n", " np.place(predicts2, filtering == 0, 0)\n", "\n", " #Sum of ranks for each prediction\n", " p = bottleneck.nansum(predicts2, axis=0)\n", " n_p = np.sum(filtering, axis=0) - np.sum(CVgo, axis=0)\n", "\n", " #Number of negatives\n", " #Number of GO terms - number of postiive\n", " n_n = filtering.shape[0] - np.sum(filtering, axis=0)\n", "\n", " roc = (p / n_p - (n_p + 1) / 2) / n_n\n", " U = roc * n_p * n_n\n", " Z = (np.abs(U - (n_p * n_n / 2))) / np.sqrt(n_p * n_n *\n", " (n_p + n_n + 1) / 12)\n", " roc = roc.reshape(nFold, go.shape[1])\n", " Z = Z.reshape(nFold, go.shape[1])\n", " #Stouffer Z method\n", " Z = bottleneck.nansum(Z, axis=0) / np.sqrt(nFold)\n", " #Calc ROC of Neighbor Voting\n", " roc = bottleneck.nanmean(roc, axis=0)\n", " P = stats.norm.sf(Z)\n", "\n", " #Average degree for nodes in each go term\n", " avg_degree = degree.dot(go) / np.sum(go, axis=0)\n", "\n", " #Calc null auc for degree\n", " ranks = np.tile(stats.rankdata(degree), (go.shape[1], 1)).T\n", "\n", " np.place(ranks, go == 0, 0)\n", "\n", " n_p = bottleneck.nansum(go, axis=0)\n", " nn = go.shape[0] - n_p\n", " p = bottleneck.nansum(ranks, axis=0)\n", "\n", " roc_null = (p / n_p - ((n_p + 1) / 2)) / nn\n", " #print(roc)\n", " return roc, avg_degree, roc_null, P\n", "\n", "\n", "#reads the go_prop file\n", "#pickle_in = open('gotermindex.pickle','rb')" ] }, { "cell_type": "code", "execution_count": 216, "metadata": {}, "outputs": [], "source": [ "from scipy.sparse import coo_matrix\n", "#Data handling\n", "import h5py\n", "\n", "import logging\n", "#Mathematical libraries\n", "import numpy as np\n", "\n", "import pandas as pd\n", "\n", "%matplotlib inline\n", "\n", "import bottleneck\n", "\n", "import matplotlib.pyplot as plt\n", "#df_go_id_enseml = pd.read_csv('/data/johlee/geneIDConversions/9606_gene_info.tab', sep='\\t') #this file has a lot of mapping, EntrezID, uniprot, Ensembl ID, genename\n", "#df_go_id_enseml.dropna(subset=['EnsemblID'])\n", "#mydict_EID_UID = dict(zip(df_go_id_enseml.EnsemblID, df_go_id_enseml.UniProtID))\n", "def parse_go_hd5(filename):\n", " \"\"\"\n", " Loads data in file to dataframe.\n", " \"\"\"\n", " with h5py.File(filename, 'r') as f:\n", " col_uid = []\n", " logging.debug(\"reading matrix...\")\n", " row = [ s.decode() for s in f['GO'][:] ]\n", " columns = [ s.decode() for s in f['genes'][:] ]\n", " matrix = f['ind'][:] - 1 #the indices in this matrix are stored from 1 \n", " coo = coo_matrix(( np.ones(1901323) , (matrix[0,:],matrix[1,:] )), shape=(len(columns), len(row)) )\n", " logging.debug(\"reading columns. converting to unicode\")\n", " for x in columns:\n", " try:\n", " col_uid.append(x)\n", " except KeyError:\n", " print (x)\n", " col_uid.append('del')\n", " #col_uid = [mydict_EID_UID[x] for x in columns]\n", " logging.debug(\"making dataframe...\")\n", "\n", " print (coo.toarray().shape)\n", " df = pd.DataFrame(coo.toarray(), index=col_uid, columns = row )\n", " return df\n" ] }, { "cell_type": "code", "execution_count": 217, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "(19016, 22517)\n" ] } ], "source": [ "go_df = parse_go_hd5(\"/data/johlee/CoCoCoNet/gene2go/human_gene2go.hdf5\")\n", "duplicates = go_df.index.duplicated(keep='first')\n", "go_df = go_df.loc[~duplicates, :]" ] }, { "cell_type": "code", "execution_count": 12, "metadata": {}, "outputs": [], "source": [ "from lohia_utilities.load_lee_matrix import parse_expression_hd5_lee\n", "exp_file = parse_expression_hd5_lee(\"/data/johlee/CoCoCoNet/networks/human_prioAggNet.hdf5\")" ] }, { "cell_type": "code", "execution_count": 26, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | ENSG00000278267 | \n", "ENSG00000233750 | \n", "ENSG00000268903 | \n", "ENSG00000269981 | \n", "ENSG00000241860 | \n", "ENSG00000279928 | \n", "ENSG00000279457 | \n", "ENSG00000228463 | \n", "ENSG00000237094 | \n", "ENSG00000225972 | \n", "... | \n", "ENSG00000275594 | \n", "ENSG00000276497 | \n", "ENSG00000273850 | \n", "ENSG00000271254 | \n", "ENSG00000275405 | \n", "ENSG00000276345 | \n", "ENSG00000277856 | \n", "ENSG00000275063 | \n", "ENSG00000278817 | \n", "ENSG00000277196 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
ENSG00000278267 | \n", "1.000000 | \n", "0.343890 | \n", "0.487717 | \n", "0.504516 | \n", "0.479969 | \n", "0.343116 | \n", "0.896050 | \n", "0.229694 | \n", "0.550274 | \n", "0.208983 | \n", "... | \n", "0.089306 | \n", "0.275199 | \n", "0.708864 | \n", "0.491642 | \n", "0.013446 | \n", "0.085152 | \n", "0.025113 | \n", "0.005367 | \n", "0.458116 | \n", "0.389884 | \n", "
ENSG00000233750 | \n", "0.343890 | \n", "1.000000 | \n", "0.860658 | \n", "0.809451 | \n", "0.673940 | \n", "0.028341 | \n", "0.463029 | \n", "0.399338 | \n", "0.764022 | \n", "0.018238 | \n", "... | \n", "0.042306 | \n", "0.004487 | \n", "0.202850 | \n", "0.146670 | \n", "0.028417 | \n", "0.055478 | \n", "0.045883 | \n", "0.013963 | \n", "0.154940 | \n", "0.049407 | \n", "
ENSG00000268903 | \n", "0.487717 | \n", "0.860658 | \n", "1.000000 | \n", "0.946427 | \n", "0.811533 | \n", "0.065573 | \n", "0.767021 | \n", "0.441015 | \n", "0.856639 | \n", "0.194718 | \n", "... | \n", "0.019009 | \n", "0.025281 | \n", "0.510202 | \n", "0.078068 | \n", "0.015855 | \n", "0.092469 | \n", "0.077274 | \n", "0.031017 | \n", "0.374283 | \n", "0.242737 | \n", "
ENSG00000269981 | \n", "0.504516 | \n", "0.809451 | \n", "0.946427 | \n", "1.000000 | \n", "0.833857 | \n", "0.110389 | \n", "0.656542 | \n", "0.527122 | \n", "0.903084 | \n", "0.067739 | \n", "... | \n", "0.069903 | \n", "0.070774 | \n", "0.478497 | \n", "0.264099 | \n", "0.021557 | \n", "0.101842 | \n", "0.079891 | \n", "0.014742 | \n", "0.169647 | \n", "0.230788 | \n", "
ENSG00000241860 | \n", "0.479969 | \n", "0.673940 | \n", "0.811533 | \n", "0.833857 | \n", "1.000000 | \n", "0.083856 | \n", "0.508489 | \n", "0.340035 | \n", "0.944649 | \n", "0.002976 | \n", "... | \n", "0.208856 | \n", "0.125405 | \n", "0.327995 | \n", "0.624400 | \n", "0.257520 | \n", "0.018642 | \n", "0.034978 | \n", "0.019394 | \n", "0.278851 | \n", "0.139266 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
ENSG00000276345 | \n", "0.085152 | \n", "0.055478 | \n", "0.092469 | \n", "0.101842 | \n", "0.018642 | \n", "0.001793 | \n", "0.261986 | \n", "0.020327 | \n", "0.091009 | \n", "0.017107 | \n", "... | \n", "0.007437 | \n", "0.026895 | \n", "0.174295 | \n", "0.115015 | \n", "0.018660 | \n", "1.000000 | \n", "0.011710 | \n", "0.004271 | \n", "0.095571 | \n", "0.024167 | \n", "
ENSG00000277856 | \n", "0.025113 | \n", "0.045883 | \n", "0.077274 | \n", "0.079891 | \n", "0.034978 | \n", "0.067405 | \n", "0.140386 | \n", "0.012266 | \n", "0.094181 | \n", "0.032696 | \n", "... | \n", "0.003437 | \n", "0.000490 | \n", "0.095768 | \n", "0.078241 | \n", "0.056294 | \n", "0.011710 | \n", "1.000000 | \n", "0.738243 | \n", "0.057777 | \n", "0.063847 | \n", "
ENSG00000275063 | \n", "0.005367 | \n", "0.013963 | \n", "0.031017 | \n", "0.014742 | \n", "0.019394 | \n", "0.019134 | \n", "0.067660 | \n", "0.011989 | \n", "0.042390 | \n", "0.051837 | \n", "... | \n", "0.005523 | \n", "0.000559 | \n", "0.062007 | \n", "0.091597 | \n", "0.009911 | \n", "0.004271 | \n", "0.738243 | \n", "1.000000 | \n", "0.005105 | \n", "0.007100 | \n", "
ENSG00000278817 | \n", "0.458116 | \n", "0.154940 | \n", "0.374283 | \n", "0.169647 | \n", "0.278851 | \n", "0.255696 | \n", "0.762126 | \n", "0.355218 | \n", "0.176952 | \n", "0.365041 | \n", "... | \n", "0.063697 | \n", "0.229018 | \n", "0.651330 | \n", "0.456410 | \n", "0.063993 | \n", "0.095571 | \n", "0.057777 | \n", "0.005105 | \n", "1.000000 | \n", "0.851643 | \n", "
ENSG00000277196 | \n", "0.389884 | \n", "0.049407 | \n", "0.242737 | \n", "0.230788 | \n", "0.139266 | \n", "0.257408 | \n", "0.619342 | \n", "0.117430 | \n", "0.171613 | \n", "0.250084 | \n", "... | \n", "0.012124 | \n", "0.167913 | \n", "0.475094 | \n", "0.344548 | \n", "0.027745 | \n", "0.024167 | \n", "0.063847 | \n", "0.007100 | \n", "0.851643 | \n", "1.000000 | \n", "
24631 rows × 24631 columns
\n", "\n", " | ENSG00000227232 | \n", "ENSG00000223972 | \n", "ENSG00000237613 | \n", "ENSG00000186092 | \n", "ENSG00000235249 | \n", "ENSG00000185097 | \n", "ENSG00000228327 | \n", "ENSG00000228794 | \n", "ENSG00000230368 | \n", "ENSG00000230699 | \n", "... | \n", "ENSG00000177151 | \n", "ENSG00000187701 | \n", "ENSG00000189181 | \n", "ENSG00000232694 | \n", "ENSG00000266949 | \n", "ENSG00000175137 | \n", "ENSG00000264500 | \n", "ENSG00000171161 | \n", "ENSG00000171163 | \n", "ENSG00000185220 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
Gene stable ID | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
ENSG00000227232 | \n", "0 | \n", "26 | \n", "26 | \n", "26 | \n", "0 | \n", "1011 | \n", "379 | \n", "379 | \n", "208 | \n", "208 | \n", "... | \n", "29 | \n", "29 | \n", "29 | \n", "29 | \n", "47 | \n", "207 | \n", "207 | \n", "207 | \n", "207 | \n", "1815 | \n", "
ENSG00000223972 | \n", "26 | \n", "0 | \n", "26 | \n", "26 | \n", "0 | \n", "1011 | \n", "379 | \n", "379 | \n", "208 | \n", "208 | \n", "... | \n", "29 | \n", "29 | \n", "29 | \n", "29 | \n", "47 | \n", "207 | \n", "207 | \n", "207 | \n", "207 | \n", "1815 | \n", "
ENSG00000237613 | \n", "26 | \n", "26 | \n", "0 | \n", "26 | \n", "0 | \n", "1011 | \n", "379 | \n", "379 | \n", "208 | \n", "208 | \n", "... | \n", "29 | \n", "29 | \n", "29 | \n", "29 | \n", "47 | \n", "207 | \n", "207 | \n", "207 | \n", "207 | \n", "1815 | \n", "
ENSG00000186092 | \n", "26 | \n", "26 | \n", "26 | \n", "0 | \n", "0 | \n", "1011 | \n", "379 | \n", "379 | \n", "208 | \n", "208 | \n", "... | \n", "29 | \n", "29 | \n", "29 | \n", "29 | \n", "47 | \n", "207 | \n", "207 | \n", "207 | \n", "207 | \n", "1815 | \n", "
ENSG00000235249 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
ENSG00000175137 | \n", "207 | \n", "207 | \n", "207 | \n", "207 | \n", "0 | \n", "192 | \n", "136 | \n", "136 | \n", "74 | \n", "74 | \n", "... | \n", "4900 | \n", "4900 | \n", "4900 | \n", "4900 | \n", "5000 | \n", "0 | \n", "18 | \n", "18 | \n", "18 | \n", "18 | \n", "
ENSG00000264500 | \n", "207 | \n", "207 | \n", "207 | \n", "207 | \n", "0 | \n", "192 | \n", "136 | \n", "136 | \n", "74 | \n", "74 | \n", "... | \n", "4900 | \n", "4900 | \n", "4900 | \n", "4900 | \n", "5000 | \n", "18 | \n", "0 | \n", "18 | \n", "18 | \n", "18 | \n", "
ENSG00000171161 | \n", "207 | \n", "207 | \n", "207 | \n", "207 | \n", "0 | \n", "192 | \n", "136 | \n", "136 | \n", "74 | \n", "74 | \n", "... | \n", "4900 | \n", "4900 | \n", "4900 | \n", "4900 | \n", "5000 | \n", "18 | \n", "18 | \n", "0 | \n", "18 | \n", "18 | \n", "
ENSG00000171163 | \n", "207 | \n", "207 | \n", "207 | \n", "207 | \n", "0 | \n", "192 | \n", "136 | \n", "136 | \n", "74 | \n", "74 | \n", "... | \n", "4900 | \n", "4900 | \n", "4900 | \n", "4900 | \n", "5000 | \n", "18 | \n", "18 | \n", "18 | \n", "0 | \n", "18 | \n", "
ENSG00000185220 | \n", "1815 | \n", "1815 | \n", "1815 | \n", "1815 | \n", "0 | \n", "291 | \n", "161 | \n", "161 | \n", "96 | \n", "96 | \n", "... | \n", "3769 | \n", "3769 | \n", "3769 | \n", "3769 | \n", "3869 | \n", "18 | \n", "18 | \n", "18 | \n", "18 | \n", "0 | \n", "
2426 rows × 2426 columns
\n", "\n", " | ENSG00000227232 | \n", "ENSG00000223972 | \n", "ENSG00000237613 | \n", "ENSG00000186092 | \n", "ENSG00000235249 | \n", "ENSG00000185097 | \n", "ENSG00000228327 | \n", "ENSG00000228794 | \n", "ENSG00000230368 | \n", "ENSG00000230699 | \n", "... | \n", "ENSG00000177151 | \n", "ENSG00000187701 | \n", "ENSG00000189181 | \n", "ENSG00000232694 | \n", "ENSG00000266949 | \n", "ENSG00000175137 | \n", "ENSG00000264500 | \n", "ENSG00000171161 | \n", "ENSG00000171163 | \n", "ENSG00000185220 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
Gene stable ID | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
ENSG00000227232 | \n", "0 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "... | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "
ENSG00000223972 | \n", "1 | \n", "0 | \n", "1 | \n", "1 | \n", "0 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "... | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "
ENSG00000237613 | \n", "1 | \n", "1 | \n", "0 | \n", "1 | \n", "0 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "... | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "
ENSG00000186092 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "0 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "... | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "
ENSG00000235249 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
ENSG00000175137 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "... | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "
ENSG00000264500 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "... | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "1 | \n", "1 | \n", "1 | \n", "
ENSG00000171161 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "... | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "1 | \n", "1 | \n", "
ENSG00000171163 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "... | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "1 | \n", "
ENSG00000185220 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "... | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "
2426 rows × 2426 columns
\n", "\n", " | tss_tss | \n", "exp | \n", "exp_georg | \n", "hi-c-rao | \n", "strand_x | \n", "gene_order_tss_x | \n", "gene_order_tes_x | \n", "Gene stable ID_x | \n", "Gene type_x | \n", "Uniprot_dc_x | \n", "... | \n", "chrom_x | \n", "strand_y | \n", "gene_order_tss_y | \n", "gene_order_tes_y | \n", "Gene stable ID_y | \n", "Gene type_y | \n", "Uniprot_dc_y | \n", "dc_y | \n", "seq_length_y | \n", "chrom_y | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "0 | \n", "1.000000 | \n", "0.851248 | \n", "0.0 | \n", "+ | \n", "1013 | \n", "1015 | \n", "ENSG00000089289 | \n", "protein_coding | \n", "P78318 | \n", "... | \n", "chrX | \n", "+ | \n", "1013 | \n", "1015 | \n", "ENSG00000089289 | \n", "protein_coding | \n", "P78318 | \n", "0.218289 | \n", "339.0 | \n", "chrX | \n", "
1 | \n", "48500772 | \n", "0.194329 | \n", "NaN | \n", "NaN | \n", "- | \n", "1693 | \n", "1692 | \n", "ENSG00000230399 | \n", "NaN | \n", "NaN | \n", "... | \n", "chrX | \n", "+ | \n", "1013 | \n", "1015 | \n", "ENSG00000089289 | \n", "protein_coding | \n", "P78318 | \n", "0.218289 | \n", "339.0 | \n", "chrX | \n", "
2 | \n", "14644244 | \n", "0.912021 | \n", "NaN | \n", "2119.0 | \n", "- | \n", "891 | \n", "891 | \n", "ENSG00000247746 | \n", "protein_coding | \n", "Q70EK9 | \n", "... | \n", "chrX | \n", "+ | \n", "1013 | \n", "1015 | \n", "ENSG00000089289 | \n", "protein_coding | \n", "P78318 | \n", "0.218289 | \n", "339.0 | \n", "chrX | \n", "
3 | \n", "22650500 | \n", "0.964389 | \n", "NaN | \n", "1966.0 | \n", "- | \n", "598 | \n", "597 | \n", "ENSG00000147124 | \n", "protein_coding | \n", "P51814 | \n", "... | \n", "chrX | \n", "+ | \n", "1013 | \n", "1015 | \n", "ENSG00000089289 | \n", "protein_coding | \n", "P78318 | \n", "0.218289 | \n", "339.0 | \n", "chrX | \n", "
4 | \n", "13404206 | \n", "0.989904 | \n", "NaN | \n", "2345.0 | \n", "+ | \n", "905 | \n", "907 | \n", "ENSG00000204272 | \n", "protein_coding | \n", "A0A0U1RRE5 | \n", "... | \n", "chrX | \n", "+ | \n", "1013 | \n", "1015 | \n", "ENSG00000089289 | \n", "protein_coding | \n", "P78318 | \n", "0.218289 | \n", "339.0 | \n", "chrX | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
597524 | \n", "30681475 | \n", "0.903413 | \n", "NaN | \n", "NaN | \n", "+ | \n", "2358 | \n", "2359 | \n", "ENSG00000269335 | \n", "protein_coding | \n", "Q9Y6K9 | \n", "... | \n", "chrX | \n", "+ | \n", "1809 | \n", "1812 | \n", "ENSG00000101966 | \n", "protein_coding | \n", "P98170 | \n", "0.000000 | \n", "497.0 | \n", "chrX | \n", "
597525 | \n", "5020185 | \n", "0.513123 | \n", "NaN | \n", "4116.0 | \n", "+ | \n", "1698 | \n", "1699 | \n", "ENSG00000203650 | \n", "NaN | \n", "NaN | \n", "... | \n", "chrX | \n", "+ | \n", "1809 | \n", "1812 | \n", "ENSG00000101966 | \n", "protein_coding | \n", "P98170 | \n", "0.000000 | \n", "497.0 | \n", "chrX | \n", "
597526 | \n", "103592204 | \n", "0.985573 | \n", "0.701583 | \n", "270.0 | \n", "- | \n", "254 | \n", "254 | \n", "ENSG00000177189 | \n", "protein_coding | \n", "P51812 | \n", "... | \n", "chrX | \n", "+ | \n", "1809 | \n", "1812 | \n", "ENSG00000101966 | \n", "protein_coding | \n", "P98170 | \n", "0.000000 | \n", "497.0 | \n", "chrX | \n", "
597527 | \n", "8359757 | \n", "0.973737 | \n", "0.705286 | \n", "3663.0 | \n", "- | \n", "1913 | \n", "1912 | \n", "ENSG00000123728 | \n", "protein_coding | \n", "Q9Y3L5 | \n", "... | \n", "chrX | \n", "+ | \n", "1809 | \n", "1812 | \n", "ENSG00000101966 | \n", "protein_coding | \n", "P98170 | \n", "0.000000 | \n", "497.0 | \n", "chrX | \n", "
597528 | \n", "0 | \n", "1.000000 | \n", "0.851248 | \n", "0.0 | \n", "+ | \n", "1809 | \n", "1812 | \n", "ENSG00000101966 | \n", "protein_coding | \n", "P98170 | \n", "... | \n", "chrX | \n", "+ | \n", "1809 | \n", "1812 | \n", "ENSG00000101966 | \n", "protein_coding | \n", "P98170 | \n", "0.000000 | \n", "497.0 | \n", "chrX | \n", "
597529 rows × 22 columns
\n", "\n", " | tss_tss | \n", "exp | \n", "hi-c-rao | \n", "Gene stable ID_x | \n", "Gene stable ID_y | \n", "chrom_x | \n", "gene_order_tss_x | \n", "gene_order_tss_y | \n", "
---|---|---|---|---|---|---|---|---|
0 | \n", "0 | \n", "0.999161 | \n", "0.0 | \n", "ENSG00000101868 | \n", "ENSG00000101868 | \n", "chrX | \n", "308 | \n", "308 | \n", "
4 | \n", "15885463 | \n", "0.794246 | \n", "1278.0 | \n", "ENSG00000182220 | \n", "ENSG00000101868 | \n", "chrX | \n", "476 | \n", "308 | \n", "
5 | \n", "129717615 | \n", "0.745656 | \n", "282.0 | \n", "ENSG00000102125 | \n", "ENSG00000101868 | \n", "chrX | \n", "2344 | \n", "308 | \n", "
6 | \n", "40340805 | \n", "0.928513 | \n", "987.0 | \n", "ENSG00000126970 | \n", "ENSG00000101868 | \n", "chrX | \n", "950 | \n", "308 | \n", "
7 | \n", "68980104 | \n", "0.263513 | \n", "694.0 | \n", "ENSG00000179083 | \n", "ENSG00000101868 | \n", "chrX | \n", "1331 | \n", "308 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
597524 | \n", "37279597 | \n", "0.398370 | \n", "1065.0 | \n", "ENSG00000158427 | \n", "ENSG00000131080 | \n", "chrX | \n", "1507 | \n", "976 | \n", "
597525 | \n", "8728478 | \n", "0.641730 | \n", "3344.0 | \n", "ENSG00000198205 | \n", "ENSG00000131080 | \n", "chrX | \n", "920 | \n", "976 | \n", "
597526 | \n", "19056891 | \n", "0.424817 | \n", "1580.0 | \n", "ENSG00000102265 | \n", "ENSG00000131080 | \n", "chrX | \n", "602 | \n", "976 | \n", "
597527 | \n", "5271519 | \n", "0.441382 | \n", "2781.0 | \n", "ENSG00000204131 | \n", "ENSG00000131080 | \n", "chrX | \n", "1079 | \n", "976 | \n", "
597528 | \n", "0 | \n", "0.999161 | \n", "0.0 | \n", "ENSG00000131080 | \n", "ENSG00000131080 | \n", "chrX | \n", "976 | \n", "976 | \n", "
356409 rows × 8 columns
\n", "\n", " | tss_tss | \n", "exp | \n", "hi-c-rao | \n", "Gene stable ID_x | \n", "Gene stable ID_y | \n", "chrom_x | \n", "exp_mean | \n", "
---|---|---|---|---|---|---|---|
pairs | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
ENSG00000101868_ENSG00000101868 | \n", "0 | \n", "1.000000 | \n", "0.0 | \n", "ENSG00000101868 | \n", "ENSG00000101868 | \n", "chrX | \n", "0.605398 | \n", "
ENSG00000101868_ENSG00000182220 | \n", "15885463 | \n", "0.893384 | \n", "1278.0 | \n", "ENSG00000182220 | \n", "ENSG00000101868 | \n", "chrX | \n", "0.704656 | \n", "
ENSG00000101868_ENSG00000102125 | \n", "129717615 | \n", "0.864865 | \n", "282.0 | \n", "ENSG00000102125 | \n", "ENSG00000101868 | \n", "chrX | \n", "0.625642 | \n", "
ENSG00000101868_ENSG00000126970 | \n", "40340805 | \n", "0.963447 | \n", "987.0 | \n", "ENSG00000126970 | \n", "ENSG00000101868 | \n", "chrX | \n", "0.702912 | \n", "
ENSG00000101868_ENSG00000179083 | \n", "68980104 | \n", "0.423822 | \n", "694.0 | \n", "ENSG00000179083 | \n", "ENSG00000101868 | \n", "chrX | \n", "0.425180 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
ENSG00000131080_ENSG00000158427 | \n", "37279597 | \n", "0.574872 | \n", "1065.0 | \n", "ENSG00000158427 | \n", "ENSG00000131080 | \n", "chrX | \n", "0.566538 | \n", "
ENSG00000131080_ENSG00000198205 | \n", "8728478 | \n", "0.794596 | \n", "3344.0 | \n", "ENSG00000198205 | \n", "ENSG00000131080 | \n", "chrX | \n", "0.567519 | \n", "
ENSG00000131080_ENSG00000102265 | \n", "19056891 | \n", "0.601445 | \n", "1580.0 | \n", "ENSG00000102265 | \n", "ENSG00000131080 | \n", "chrX | \n", "0.581551 | \n", "
ENSG00000131080_ENSG00000204131 | \n", "5271519 | \n", "0.617975 | \n", "2781.0 | \n", "ENSG00000204131 | \n", "ENSG00000131080 | \n", "chrX | \n", "0.583395 | \n", "
ENSG00000131080_ENSG00000131080 | \n", "0 | \n", "1.000000 | \n", "0.0 | \n", "ENSG00000131080 | \n", "ENSG00000131080 | \n", "chrX | \n", "0.767078 | \n", "
356409 rows × 7 columns
\n", "\n", " | chrm | \n", "num_pairs | \n", "dist_thresh | \n", "auc | \n", "plot | \n", "pr_curve | \n", "true_pos | \n", "true_neg | \n", "exp_median | \n", "exp_mean | \n", "exp_var | \n", "Gene stable ID | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "chr11 | \n", "1004 | \n", "4000 | \n", "NaN | \n", "{0.0: nan, 0.01: nan, 0.02: nan, 0.03: nan, 0.... | \n", "{} | \n", "0 | \n", "650 | \n", "0.592583 | \n", "0.547375 | \n", "0.063044 | \n", "ENSG00000174669 | \n", "
1 | \n", "chr11 | \n", "1004 | \n", "4000 | \n", "NaN | \n", "{0.0: nan, 0.01: nan, 0.02: nan, 0.03: nan, 0.... | \n", "{} | \n", "0 | \n", "932 | \n", "0.732026 | \n", "0.656574 | \n", "0.070272 | \n", "ENSG00000183340 | \n", "
2 | \n", "chr11 | \n", "1004 | \n", "4000 | \n", "NaN | \n", "{0.0: nan, 0.01: nan, 0.02: nan, 0.03: nan, 0.... | \n", "{} | \n", "0 | \n", "647 | \n", "0.392391 | \n", "0.379631 | \n", "0.036577 | \n", "ENSG00000182791 | \n", "
3 | \n", "chr11 | \n", "1004 | \n", "4000 | \n", "NaN | \n", "{0.0: nan, 0.01: nan, 0.02: nan, 0.03: nan, 0.... | \n", "{} | \n", "0 | \n", "828 | \n", "0.822697 | \n", "0.728352 | \n", "0.067169 | \n", "ENSG00000132275 | \n", "
4 | \n", "chr11 | \n", "1004 | \n", "4000 | \n", "0.561063 | \n", "{0.0: 0.0, 0.01: 0.0, 0.02: 0.0104166666666666... | \n", "{0.0: 0.0, 0.08: 0.021899579772188874, 0.17: 0... | \n", "12 | \n", "696 | \n", "0.650224 | \n", "0.608971 | \n", "0.084299 | \n", "ENSG00000168496 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
999 | \n", "chr11 | \n", "1004 | \n", "4000 | \n", "NaN | \n", "{0.0: nan, 0.01: nan, 0.02: nan, 0.03: nan, 0.... | \n", "{} | \n", "0 | \n", "896 | \n", "0.710174 | \n", "0.617268 | \n", "0.067416 | \n", "ENSG00000151702 | \n", "
1000 | \n", "chr11 | \n", "1004 | \n", "4000 | \n", "0.820235 | \n", "{0.0: 0.0, 0.01: 0.0, 0.02: 0.0, 0.03: 0.0, 0.... | \n", "{0.0: 0.0, 0.33: 0.011573465587966434, 0.67: 0... | \n", "3 | \n", "738 | \n", "0.580503 | \n", "0.522850 | \n", "0.076284 | \n", "ENSG00000156587 | \n", "
1001 | \n", "chr11 | \n", "1004 | \n", "4000 | \n", "NaN | \n", "{0.0: nan, 0.01: nan, 0.02: nan, 0.03: nan, 0.... | \n", "{} | \n", "0 | \n", "646 | \n", "0.653405 | \n", "0.605870 | \n", "0.066594 | \n", "ENSG00000173715 | \n", "
1002 | \n", "chr11 | \n", "1004 | \n", "4000 | \n", "0.427163 | \n", "{0.0: 0.0, 0.01: 0.0, 0.02: 0.0, 0.03: 0.01739... | \n", "{0.0: 0.0, 0.04: 0.03137291143578475, 0.09: 0.... | \n", "23 | \n", "913 | \n", "0.657461 | \n", "0.592015 | \n", "0.051981 | \n", "ENSG00000166086 | \n", "
1003 | \n", "chr11 | \n", "1004 | \n", "4000 | \n", "NaN | \n", "{0.0: nan, 0.01: nan, 0.02: nan, 0.03: nan, 0.... | \n", "{} | \n", "0 | \n", "647 | \n", "0.728689 | \n", "0.649545 | \n", "0.071352 | \n", "ENSG00000239306 | \n", "
1004 rows × 12 columns
\n", "\n", " | chrm | \n", "num_pairs | \n", "dist_thresh | \n", "auc | \n", "plot | \n", "pr_curve | \n", "true_pos | \n", "true_neg | \n", "exp_median | \n", "exp_mean | \n", "exp_var | \n", "Gene stable ID | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|
4 | \n", "chr16 | \n", "773 | \n", "2000 | \n", "NaN | \n", "{0.0: nan, 0.01: nan, 0.02: nan, 0.03: nan, 0.... | \n", "{} | \n", "0 | \n", "495 | \n", "0.345003 | \n", "0.322651 | \n", "0.030117 | \n", "ENSG00000245694 | \n", "
9 | \n", "chr16 | \n", "773 | \n", "2000 | \n", "NaN | \n", "{0.0: nan, 0.01: nan, 0.02: nan, 0.03: nan, 0.... | \n", "{} | \n", "0 | \n", "496 | \n", "0.619299 | \n", "0.585025 | \n", "0.087750 | \n", "ENSG00000245694 | \n", "
14 | \n", "chr16 | \n", "773 | \n", "2000 | \n", "NaN | \n", "{0.0: nan, 0.01: nan, 0.02: nan, 0.03: nan, 0.... | \n", "{} | \n", "0 | \n", "437 | \n", "0.486055 | \n", "0.477094 | \n", "0.069154 | \n", "ENSG00000198931 | \n", "
19 | \n", "chr16 | \n", "773 | \n", "2000 | \n", "NaN | \n", "{0.0: nan, 0.01: nan, 0.02: nan, 0.03: nan, 0.... | \n", "{} | \n", "0 | \n", "420 | \n", "0.554352 | \n", "0.556762 | \n", "0.077769 | \n", "ENSG00000243716 | \n", "
24 | \n", "chr16 | \n", "773 | \n", "2000 | \n", "NaN | \n", "{0.0: nan, 0.01: nan, 0.02: nan, 0.03: nan, 0.... | \n", "{} | \n", "0 | \n", "428 | \n", "0.828832 | \n", "0.726001 | \n", "0.064853 | \n", "ENSG00000168434 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
3844 | \n", "chr16 | \n", "773 | \n", "2000 | \n", "NaN | \n", "{0.0: nan, 0.01: nan, 0.02: nan, 0.03: nan, 0.... | \n", "{} | \n", "0 | \n", "428 | \n", "0.425241 | \n", "0.405120 | \n", "0.049482 | \n", "ENSG00000260807 | \n", "
3849 | \n", "chr16 | \n", "773 | \n", "2000 | \n", "NaN | \n", "{0.0: nan, 0.01: nan, 0.02: nan, 0.03: nan, 0.... | \n", "{} | \n", "0 | \n", "432 | \n", "0.490119 | \n", "0.454270 | \n", "0.064232 | \n", "ENSG00000169627 | \n", "
3854 | \n", "chr16 | \n", "773 | \n", "2000 | \n", "NaN | \n", "{0.0: nan, 0.01: nan, 0.02: nan, 0.03: nan, 0.... | \n", "{} | \n", "0 | \n", "442 | \n", "0.474922 | \n", "0.465165 | \n", "0.052825 | \n", "ENSG00000248124 | \n", "
3859 | \n", "chr16 | \n", "773 | \n", "2000 | \n", "NaN | \n", "{0.0: nan, 0.01: nan, 0.02: nan, 0.03: nan, 0.... | \n", "{} | \n", "0 | \n", "494 | \n", "0.360949 | \n", "0.368468 | \n", "0.032043 | \n", "ENSG00000102935 | \n", "
3864 | \n", "chr16 | \n", "773 | \n", "2000 | \n", "NaN | \n", "{0.0: nan, 0.01: nan, 0.02: nan, 0.03: nan, 0.... | \n", "{} | \n", "0 | \n", "495 | \n", "0.572479 | \n", "0.551079 | \n", "0.061528 | \n", "ENSG00000177200 | \n", "
773 rows × 12 columns
\n", "\n", " | chrm | \n", "num_pairs | \n", "dist_thresh | \n", "auc | \n", "pr_curve | \n", "true_pos | \n", "true_neg | \n", "exp_median | \n", "exp_mean | \n", "exp_var | \n", "... | \n", "0.82 | \n", "0.83 | \n", "0.85 | \n", "0.86 | \n", "0.88 | \n", "0.89 | \n", "0.9 | \n", "0.91 | \n", "0.92 | \n", "1.0 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "chr11 | \n", "1004 | \n", "2.0 | \n", "0.603357 | \n", "{0.0: 1.0, 0.01: 1.0, 0.02: 1.0, 0.03: 1.0, 0.... | \n", "566 | \n", "2 | \n", "0.818331 | \n", "0.709948 | \n", "0.077252 | \n", "... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.863074 | \n", "
1 | \n", "chr11 | \n", "1004 | \n", "1.0 | \n", "0.950000 | \n", "{0.0: 1.0, 0.01: 1.0, 0.02: 1.0, 0.03: 1.0, 0.... | \n", "480 | \n", "1 | \n", "0.711796 | \n", "0.638367 | \n", "0.072380 | \n", "... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.975000 | \n", "
2 | \n", "chr11 | \n", "1004 | \n", "1.0 | \n", "0.990826 | \n", "{0.0: 1.0, 0.01: 1.0, 0.02: 1.0, 0.03: 1.0, 0.... | \n", "436 | \n", "1 | \n", "0.680995 | \n", "0.613632 | \n", "0.075320 | \n", "... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.995413 | \n", "
3 | \n", "chr11 | \n", "1004 | \n", "2.0 | \n", "0.964930 | \n", "{0.0: 1.0, 0.01: 1.0, 0.02: 1.0, 0.03: 1.0, 0.... | \n", "499 | \n", "2 | \n", "0.690213 | \n", "0.630627 | \n", "0.070869 | \n", "... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.994990 | \n", "
4 | \n", "chr11 | \n", "1004 | \n", "5.0 | \n", "0.937400 | \n", "{0.0: 1.0, 0.01: 1.0, 0.02: 1.0, 0.03: 1.0, 0.... | \n", "623 | \n", "2 | \n", "0.712888 | \n", "0.625489 | \n", "0.079132 | \n", "... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.981541 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
999 | \n", "chr11 | \n", "1004 | \n", "2.0 | \n", "0.074297 | \n", "{0.0: 1.0, 0.01: 1.0, 0.02: 1.0, 0.03: 1.0, 0.... | \n", "498 | \n", "1 | \n", "0.061497 | \n", "0.109356 | \n", "0.028743 | \n", "... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.537149 | \n", "
1000 | \n", "chr11 | \n", "1004 | \n", "6.0 | \n", "0.426445 | \n", "{0.0: 1.0, 0.01: 1.0, 0.02: 1.0, 0.03: 1.0, 0.... | \n", "571 | \n", "2 | \n", "0.264574 | \n", "0.274264 | \n", "0.040111 | \n", "... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.834501 | \n", "
1001 | \n", "chr11 | \n", "1004 | \n", "6.0 | \n", "0.650485 | \n", "{0.0: 1.0, 0.01: 1.0, 0.02: 1.0, 0.03: 1.0, 0.... | \n", "618 | \n", "1 | \n", "0.480949 | \n", "0.495839 | \n", "0.064536 | \n", "... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.825243 | \n", "
1002 | \n", "chr11 | \n", "1004 | \n", "6.0 | \n", "0.793478 | \n", "{0.0: 1.0, 0.01: 1.0, 0.02: 1.0, 0.03: 1.0, 0.... | \n", "552 | \n", "3 | \n", "0.684659 | \n", "0.632675 | \n", "0.075314 | \n", "... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.987319 | \n", "
1003 | \n", "chr11 | \n", "1004 | \n", "6.0 | \n", "0.855932 | \n", "{0.0: 1.0, 0.01: 1.0, 0.02: 1.0, 0.03: 1.0, 0.... | \n", "472 | \n", "1 | \n", "0.745523 | \n", "0.660855 | \n", "0.078882 | \n", "... | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.927966 | \n", "
1004 rows × 66 columns
\n", "