{ "cells": [ { "cell_type": "code", "execution_count": 402, "metadata": {}, "outputs": [], "source": [ "import pandas as pd\n", "import matplotlib.pyplot as plt" ] }, { "cell_type": "code", "execution_count": 581, "metadata": {}, "outputs": [], "source": [ "import re \n", "def sorted_nicely( l ): \n", " \"\"\" Sort the given iterable in the way that humans expect.\"\"\" \n", " convert = lambda text: int(text) if text.isdigit() else text \n", " alphanum_key = lambda key: [ convert(c) for c in re.split('([0-9]+)', key) ] \n", " return sorted(l, key = alphanum_key)" ] }, { "cell_type": "code", "execution_count": 1294, "metadata": {}, "outputs": [], "source": [ "import matplotlib\n", "import matplotlib.pyplot as plt\n", "from matplotlib.colors import LinearSegmentedColormap\n", "import matplotlib.ticker as plticker\n", "from matplotlib.colors import LogNorm\n", "\n", "\n", "def plots_with_1_level(group_x):\n", "\n", " change_group_level_1 = df_2_or_uniq.groupby(['chrom_x'])\n", " nrow = int(len(change_group_level_1.groups.keys())/3) + 1\n", " ncol = 3\n", " fig, axes = plt.subplots(nrows=nrow, ncols=ncol, figsize=(4*ncol, 4*nrow),sharex=True,sharey=True) \n", "\n", " for key_level_1,ax in zip(sorted_nicely(change_group_level_1.groups.keys()),axes.flatten()):\n", " given_group_level_1 = change_group_level_1.get_group(key_level_1)\n", " #given_group2 = given_group_level_1.groupby(['order_diff', 'category']).mean().groupby(level=2)['exp'].plot(ax=ax)\n", " given_group2 = given_group_level_1.groupby([group_x]).mean()['exp'].plot(ax=ax)\n", " given_group2 = given_group_level_1.groupby([group_x]).mean()['exp (GK)'].plot(ax=ax)\n", " #given_group2 = given_group_level_1.groupby([group_x]).mean()['SRP063477'].plot(ax=ax)\n", " #given_group2 = given_group_level_1.groupby([group_x]).mean()['SRP026208'].plot(ax=ax)\n", " #given_group2 = given_group_level_1.groupby([group_x]).mean()['SRP115956'].plot(ax=ax)\n", "\n", " ax.axhline(y=0.5, color='r', linestyle='-')\n", " #ax.set_xlim([0, 2000])\n", " ax.legend()\n", " rects = ax.patches \n", " ax.set_title('%s' %(key_level_1))\n", " #ax.set_ylabel('%Population')\n", " ax.set_xlabel('Distance between gene pairs (MB)')\n", " ax.set_ylabel('Co-expression')\n", " \n", "\n", "def plots_with_2_groups(group_2='None', group_3_x='category'): \n", " change_group_level_1 = df_2_or_uniq.groupby(['chrom_x'])\n", " change_group_level_2 = df_2_or_uniq.groupby([group_2])\n", " nrow = len(change_group_level_1.groups.keys())\n", " ncol = len(change_group_level_2.groups.keys())\n", " fig, axes = plt.subplots(nrows=nrow, ncols=ncol, figsize=(8*ncol, 8*nrow),sharey=True) \n", "\n", " for key_level_1,ax_row in zip(sorted_nicely(change_group_level_1.groups.keys()) ,axes):\n", " given_group_level_1 = change_group_level_1.get_group(key_level_1)\n", " change_group = given_group_level_1.groupby([group_2])\n", " for key,ax in zip(change_group.groups.keys(),ax_row):\n", " given_group = change_group.get_group(key)\n", " #given_group2 = given_group.groupby([group_3_x, 'category']).mean().groupby(level=1)['exp'].plot(ax=ax)\n", " given_group2 = given_group.groupby([group_3_x]).mean()['exp'].plot(ax=ax)\n", " given_group2 = given_group.groupby([group_3_x]).mean()['exp_georg'].plot(ax=ax)\n", " ax.legend()\n", " rects = ax.patches \n", " ax.set_title('%s, %s' %(key_level_1,key))\n", " ax.axhline(y=0.5, color='r', linestyle='-')\n", " ax.set_ylabel('%Population')\n", " ax.set_ylim([0.3, 0.9])\n", " \n", " \n", "def plots_with_2_groups_same_plot(group_2='None', group_3_x='category'): \n", " change_group_level_1 = df_2_or_uniq.groupby(['chrom_x'])\n", " change_group_level_2 = df_2_or_uniq.groupby([group_2])\n", " nrow = int(len(change_group_level_1.groups.keys())/3) + 1\n", " ncol = 3\n", " fig, axes = plt.subplots(nrows=nrow, ncols=ncol, figsize=(4*ncol, 4*nrow),sharey=True, sharex=True) \n", "\n", " for key_level_1,ax in zip(sorted_nicely(change_group_level_1.groups.keys()) ,axes.flatten()):\n", " given_group_level_1 = change_group_level_1.get_group(key_level_1)\n", " change_group = given_group_level_1.groupby([group_2])\n", " for key in change_group.groups.keys():\n", " given_group = change_group.get_group(key)\n", " #given_group2 = given_group.groupby([group_3_x, 'category']).mean().groupby(level=1)['exp'].plot(ax=ax)\n", " given_group2 = given_group.groupby([group_3_x]).mean()['exp'].plot(ax=ax)\n", " #given_group2 = given_group.groupby([group_3_x]).mean()['exp_georg'].plot(ax=ax)\n", " #ax.legend()\n", " rects = ax.patches \n", " ax.set_title('%s, %s' %(key_level_1,key))\n", " ax.axhline(y=0.5, color='r', linestyle='-')\n", " ax.set_ylabel('Co-expression')\n", " ax.set_xlabel('Distance between gene pairs (MB)')\n", " #ax.set_ylim([0.3, 0.9])\n", " \n", "\n", "def plots_with_1_level_3d(df, group_x):\n", " change_group_level_1 = df.groupby(['chrom_x'])\n", " nrow = int(len(change_group_level_1.groups.keys())/3) + 2\n", " ncol = 3\n", " fig, axes = plt.subplots(nrows=nrow, ncols=ncol, figsize=(4*ncol, 4*nrow)) \n", "\n", " for key_level_1,ax in zip(sorted_nicely(change_group_level_1.groups.keys()),axes.flatten()):\n", " given_group_level_1 = change_group_level_1.get_group(key_level_1)\n", " H = given_group_level_1.pivot_table(index='gene_order_tss_x', columns='gene_order_tss_y', values=group_x)\n", " #print (H)\n", " #print ((H - H.T).max().max())\n", " #H.mask(H < 0, inplace=True)\n", " #elix.reset_index(drop=True, inplace=True)\n", " #print (H.max())\n", " vmax= 10\n", " cmap = LinearSegmentedColormap.from_list('mycmap', [(0/ vmax, 'red'), (1./2, 'white'), (vmax / vmax, 'blue')])\n", " #cmap = LinearSegmentedColormap.from_list('mycmap', [(0/ vmax, 'white'), (vmax / vmax, 'blue')])\n", " current_cmap = cmap\n", " #current_cmap.set_bad(color='grey')\n", " # vmax= 1000000\n", " # current_cmap = LinearSegmentedColormap.from_list('mycmap', [ (0/ vmax, 'white'), (vmax / vmax, 'blue')])\n", " # imgp = ax.imshow(H.T,origin='low', aspect='auto' , cmap=current_cmap, norm=LogNorm(vmin=1, vmax=vmax))\n", " \n", " imgp = ax.imshow(H,origin='low', aspect='auto' , vmin=-1.0, vmax=vmax, cmap=current_cmap)\n", " #imgp = ax.imshow(H,origin='low', aspect='auto' , norm=LogNorm(), cmap=current_cmap)\n", " #sns.heatmap(H, annot = False) \n", " ax.set_title('%s' %(key_level_1))\n", " ax.set_yticklabels([])\n", " ax.set_xticklabels([])\n", " ax.set_xlabel(\"Genes in chromosome order\")\n", " ax.set_ylabel(\"Genes in chromosome order\")\n", " \n", " #cbar = ax.figure.colorbar(imgp, ax=ax)" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "This is for plotting lowest Hi-c for each gene in heatmap" ] }, { "cell_type": "code", "execution_count": 1881, "metadata": {}, "outputs": [], "source": [ "df_2_or = pd.read_hdf('/data/lohia/gene_distance_expresseion/dist_files/11_dist_with_georg_hic_sub_median_hic_100.h5')" ] }, { "cell_type": "code", "execution_count": 1883, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | tss_tss | \n", "exp | \n", "exp_georg | \n", "hi-c-rao | \n", "hi-c-rao-common_elements | \n", "tes_tes | \n", "strand_x | \n", "txStart_outer_x | \n", "gene_order_tss_x | \n", "gene_order_tes_x | \n", "... | \n", "txStart_outer_y | \n", "gene_order_tss_y | \n", "gene_order_tes_y | \n", "Gene stable ID_y | \n", "Gene type_y | \n", "Uniprot_dc_y | \n", "dc_y | \n", "seq_length_y | \n", "chrom_y | \n", "gene_occurence_frequency_y | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
776092 | \n", "61185939 | \n", "0.365534 | \n", "NaN | \n", "18.0 | \n", "4.0 | \n", "60577069 | \n", "- | \n", "85682908 | \n", "2344 | \n", "2344 | \n", "... | \n", "24496969 | \n", "745 | \n", "746 | \n", "ENSG00000187398 | \n", "protein_coding | \n", "Q86TE4 | \n", "0.343931 | \n", "346.0 | \n", "chr11 | \n", "2623 | \n", "
776093 | \n", "38231099 | \n", "0.285114 | \n", "NaN | \n", "7.0 | \n", "4.0 | \n", "37657655 | \n", "+ | \n", "62728068 | \n", "1583 | \n", "1583 | \n", "... | \n", "24496969 | \n", "745 | \n", "746 | \n", "ENSG00000187398 | \n", "protein_coding | \n", "Q86TE4 | \n", "0.343931 | \n", "346.0 | \n", "chr11 | \n", "2623 | \n", "
776094 | \n", "42461417 | \n", "0.262901 | \n", "NaN | \n", "5.0 | \n", "4.0 | \n", "41765778 | \n", "- | \n", "66958386 | \n", "1863 | \n", "1860 | \n", "... | \n", "24496969 | \n", "745 | \n", "746 | \n", "ENSG00000187398 | \n", "protein_coding | \n", "Q86TE4 | \n", "0.343931 | \n", "346.0 | \n", "chr11 | \n", "2623 | \n", "
776095 | \n", "38344840 | \n", "0.104930 | \n", "NaN | \n", "10.0 | \n", "4.0 | \n", "37749703 | \n", "- | \n", "62841809 | \n", "1600 | \n", "1598 | \n", "... | \n", "24496969 | \n", "745 | \n", "746 | \n", "ENSG00000187398 | \n", "protein_coding | \n", "Q86TE4 | \n", "0.343931 | \n", "346.0 | \n", "chr11 | \n", "2623 | \n", "
776096 | \n", "94076001 | \n", "0.536119 | \n", "NaN | \n", "3.0 | \n", "3.0 | \n", "93461889 | \n", "- | \n", "118572970 | \n", "2971 | \n", "2968 | \n", "... | \n", "24496969 | \n", "745 | \n", "746 | \n", "ENSG00000187398 | \n", "protein_coding | \n", "Q86TE4 | \n", "0.343931 | \n", "346.0 | \n", "chr11 | \n", "2623 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
777091 | \n", "95714062 | \n", "0.134364 | \n", "NaN | \n", "5.0 | \n", "4.0 | \n", "95147696 | \n", "+ | \n", "120211031 | \n", "3051 | \n", "3051 | \n", "... | \n", "24496969 | \n", "745 | \n", "746 | \n", "ENSG00000187398 | \n", "protein_coding | \n", "Q86TE4 | \n", "0.343931 | \n", "346.0 | \n", "chr11 | \n", "2623 | \n", "
777092 | \n", "13745724 | \n", "0.354023 | \n", "NaN | \n", "57.0 | \n", "4.0 | \n", "14281013 | \n", "+ | \n", "10751245 | \n", "509 | \n", "511 | \n", "... | \n", "24496969 | \n", "745 | \n", "746 | \n", "ENSG00000187398 | \n", "protein_coding | \n", "Q86TE4 | \n", "0.343931 | \n", "346.0 | \n", "chr11 | \n", "2623 | \n", "
777093 | \n", "13143719 | \n", "0.107614 | \n", "NaN | \n", "72.0 | \n", "4.0 | \n", "13730697 | \n", "- | \n", "11353250 | \n", "522 | \n", "522 | \n", "... | \n", "24496969 | \n", "745 | \n", "746 | \n", "ENSG00000187398 | \n", "protein_coding | \n", "Q86TE4 | \n", "0.343931 | \n", "346.0 | \n", "chr11 | \n", "2623 | \n", "
777094 | \n", "93728125 | \n", "0.103446 | \n", "NaN | \n", "3.0 | \n", "4.0 | \n", "93111086 | \n", "- | \n", "118225094 | \n", "2951 | \n", "2950 | \n", "... | \n", "24496969 | \n", "745 | \n", "746 | \n", "ENSG00000187398 | \n", "protein_coding | \n", "Q86TE4 | \n", "0.343931 | \n", "346.0 | \n", "chr11 | \n", "2623 | \n", "
777095 | \n", "33254812 | \n", "0.214934 | \n", "NaN | \n", "45.0 | \n", "4.0 | \n", "32660875 | \n", "- | \n", "57751781 | \n", "1349 | \n", "1347 | \n", "... | \n", "24496969 | \n", "745 | \n", "746 | \n", "ENSG00000187398 | \n", "protein_coding | \n", "Q86TE4 | \n", "0.343931 | \n", "346.0 | \n", "chr11 | \n", "2623 | \n", "
1004 rows × 28 columns
\n", "txStart_outer_y | \n", "139612 | \n", "196737 | \n", "207428 | \n", "207510 | \n", "236931 | \n", "236965 | \n", "278364 | \n", "289125 | \n", "307630 | \n", "313505 | \n", "... | \n", "134069070 | \n", "134224670 | \n", "134225454 | \n", "134253370 | \n", "134253494 | \n", "134274244 | \n", "134331873 | \n", "134412242 | \n", "134412283 | \n", "134735595 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
txStart_outer_x | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
139612 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "... | \n", "73.0 | \n", "86.0 | \n", "86.0 | \n", "86.0 | \n", "86.0 | \n", "86.0 | \n", "77.0 | \n", "77.0 | \n", "77.0 | \n", "106.0 | \n", "
196737 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "... | \n", "73.0 | \n", "86.0 | \n", "86.0 | \n", "86.0 | \n", "86.0 | \n", "86.0 | \n", "77.0 | \n", "77.0 | \n", "77.0 | \n", "106.0 | \n", "
207428 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "... | \n", "57.0 | \n", "72.0 | \n", "72.0 | \n", "57.0 | \n", "57.0 | \n", "57.0 | \n", "40.0 | \n", "40.0 | \n", "40.0 | \n", "56.0 | \n", "
207510 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "... | \n", "57.0 | \n", "72.0 | \n", "72.0 | \n", "57.0 | \n", "57.0 | \n", "57.0 | \n", "40.0 | \n", "40.0 | \n", "40.0 | \n", "56.0 | \n", "
236931 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "... | \n", "57.0 | \n", "72.0 | \n", "72.0 | \n", "57.0 | \n", "57.0 | \n", "57.0 | \n", "40.0 | \n", "40.0 | \n", "40.0 | \n", "56.0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
22338380 | \n", "22.0 | \n", "22.0 | \n", "25.0 | \n", "25.0 | \n", "25.0 | \n", "25.0 | \n", "25.0 | \n", "25.0 | \n", "20.0 | \n", "20.0 | \n", "... | \n", "17.0 | \n", "17.0 | \n", "17.0 | \n", "14.0 | \n", "14.0 | \n", "14.0 | \n", "14.0 | \n", "14.0 | \n", "14.0 | \n", "17.0 | \n", "
22625508 | \n", "47.0 | \n", "47.0 | \n", "50.0 | \n", "50.0 | \n", "50.0 | \n", "50.0 | \n", "50.0 | \n", "50.0 | \n", "41.0 | \n", "41.0 | \n", "... | \n", "19.0 | \n", "25.0 | \n", "25.0 | \n", "19.0 | \n", "19.0 | \n", "19.0 | \n", "12.0 | \n", "12.0 | \n", "12.0 | \n", "13.0 | \n", "
22625841 | \n", "47.0 | \n", "47.0 | \n", "50.0 | \n", "50.0 | \n", "50.0 | \n", "50.0 | \n", "50.0 | \n", "50.0 | \n", "41.0 | \n", "41.0 | \n", "... | \n", "19.0 | \n", "25.0 | \n", "25.0 | \n", "19.0 | \n", "19.0 | \n", "19.0 | \n", "12.0 | \n", "12.0 | \n", "12.0 | \n", "13.0 | \n", "
22830299 | \n", "28.0 | \n", "28.0 | \n", "25.0 | \n", "25.0 | \n", "25.0 | \n", "25.0 | \n", "25.0 | \n", "25.0 | \n", "27.0 | \n", "27.0 | \n", "... | \n", "17.0 | \n", "18.0 | \n", "18.0 | \n", "15.0 | \n", "15.0 | \n", "15.0 | \n", "14.0 | \n", "14.0 | \n", "14.0 | \n", "22.0 | \n", "
24496969 | \n", "17.0 | \n", "17.0 | \n", "21.0 | \n", "21.0 | \n", "21.0 | \n", "21.0 | \n", "21.0 | \n", "21.0 | \n", "18.0 | \n", "18.0 | \n", "... | \n", "14.0 | \n", "14.0 | \n", "14.0 | \n", "14.0 | \n", "14.0 | \n", "14.0 | \n", "12.0 | \n", "12.0 | \n", "12.0 | \n", "22.0 | \n", "
220 rows × 1002 columns
\n", "txStart_outer_y | \n", "778626 | \n", "825137 | \n", "911434 | \n", "923927 | \n", "959309 | \n", "960583 | \n", "966481 | \n", "982093 | \n", "1000172 | \n", "1001137 | \n", "... | \n", "247458105 | \n", "247507057 | \n", "247857186 | \n", "247895586 | \n", "248030069 | \n", "248095183 | \n", "248825915 | \n", "248838209 | \n", "248859144 | \n", "248906195 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
txStart_outer_x | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
778626 | \n", "1.000000 | \n", "0.795363 | \n", "0.542804 | \n", "0.451949 | \n", "0.833483 | \n", "0.867955 | \n", "0.583312 | \n", "0.434424 | \n", "0.403705 | \n", "0.242381 | \n", "... | \n", "0.302802 | \n", "0.408970 | \n", "0.508224 | \n", "0.294071 | \n", "0.313602 | \n", "0.160920 | \n", "0.896949 | \n", "0.763754 | \n", "0.932846 | \n", "0.862231 | \n", "
825137 | \n", "0.795363 | \n", "1.000000 | \n", "0.419972 | \n", "0.456052 | \n", "0.952361 | \n", "0.895054 | \n", "0.455271 | \n", "0.445425 | \n", "0.530916 | \n", "0.399459 | \n", "... | \n", "0.219729 | \n", "0.503699 | \n", "0.661096 | \n", "0.479318 | \n", "0.395441 | \n", "0.427875 | \n", "0.891803 | \n", "0.935640 | \n", "0.886646 | \n", "0.933684 | \n", "
911434 | \n", "0.542804 | \n", "0.419972 | \n", "1.000000 | \n", "0.652653 | \n", "0.521039 | \n", "0.527501 | \n", "0.410617 | \n", "0.228461 | \n", "0.253063 | \n", "0.077471 | \n", "... | \n", "0.080981 | \n", "0.088441 | \n", "0.253435 | \n", "0.283873 | \n", "0.085861 | \n", "0.082822 | \n", "0.416658 | \n", "0.378583 | \n", "0.455301 | \n", "0.338369 | \n", "
923927 | \n", "0.451949 | \n", "0.456052 | \n", "0.652653 | \n", "1.000000 | \n", "0.656982 | \n", "0.712637 | \n", "0.459915 | \n", "0.369399 | \n", "0.514615 | \n", "0.302695 | \n", "... | \n", "0.073340 | \n", "0.166112 | \n", "0.220809 | \n", "0.073019 | \n", "0.034468 | \n", "0.082952 | \n", "0.525138 | \n", "0.672329 | \n", "0.669089 | \n", "0.519295 | \n", "
959309 | \n", "0.833483 | \n", "0.952361 | \n", "0.521039 | \n", "0.656982 | \n", "1.000000 | \n", "0.986988 | \n", "0.840109 | \n", "0.699588 | \n", "0.816809 | \n", "0.837351 | \n", "... | \n", "0.217908 | \n", "0.365334 | \n", "0.732293 | \n", "0.581978 | \n", "0.160844 | \n", "0.239354 | \n", "0.977070 | \n", "0.998953 | \n", "0.979892 | \n", "0.960807 | \n", "
960583 | \n", "0.867955 | \n", "0.895054 | \n", "0.527501 | \n", "0.712637 | \n", "0.986988 | \n", "1.000000 | \n", "0.860053 | \n", "0.734980 | \n", "0.829764 | \n", "0.794470 | \n", "... | \n", "0.205503 | \n", "0.345161 | \n", "0.476788 | \n", "0.470601 | \n", "0.210881 | \n", "0.133548 | \n", "0.959885 | \n", "0.953686 | \n", "0.995867 | \n", "0.928330 | \n", "
966481 | \n", "0.583312 | \n", "0.455271 | \n", "0.410617 | \n", "0.459915 | \n", "0.840109 | \n", "0.860053 | \n", "1.000000 | \n", "0.898037 | \n", "0.820914 | \n", "0.758308 | \n", "... | \n", "0.157921 | \n", "0.098106 | \n", "0.216357 | \n", "0.081204 | \n", "0.034149 | \n", "0.003445 | \n", "0.664612 | \n", "0.824771 | \n", "0.744605 | \n", "0.512252 | \n", "
982093 | \n", "0.434424 | \n", "0.445425 | \n", "0.228461 | \n", "0.369399 | \n", "0.699588 | \n", "0.734980 | \n", "0.898037 | \n", "1.000000 | \n", "0.788004 | \n", "0.527765 | \n", "... | \n", "0.056539 | \n", "0.074405 | \n", "0.140551 | \n", "0.112722 | \n", "0.005566 | \n", "0.004332 | \n", "0.565241 | \n", "0.676115 | \n", "0.600830 | \n", "0.299363 | \n", "
8 rows × 1806 columns
\n", "\n", " | chrm | \n", "num_pairs | \n", "dist_thresh | \n", "auc | \n", "plot | \n", "pr_curve | \n", "true_pos | \n", "true_neg | \n", "exp_median | \n", "exp_mean | \n", "exp_var | \n", "Gene stable ID | \n", "mp_precited | \n", "auc_or | \n", "auc_hic | \n", "p_val | \n", "samples | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
62186 | \n", "chr11 | \n", "1004 | \n", "1 | \n", "0.901408 | \n", "{} | \n", "{} | \n", "710 | \n", "1 | \n", "0.589374 | \n", "0.545647 | \n", "0.052450 | \n", "ENSG00000187049 | \n", "ENSG00000149311 | \n", "0.992958 | \n", "0.547183 | \n", "0.029412 | \n", "272 | \n", "
62190 | \n", "chr11 | \n", "1004 | \n", "1 | \n", "0.901408 | \n", "{} | \n", "{} | \n", "710 | \n", "1 | \n", "0.589374 | \n", "0.545647 | \n", "0.052450 | \n", "ENSG00000187049 | \n", "ENSG00000150433 | \n", "0.992958 | \n", "0.432394 | \n", "0.029412 | \n", "272 | \n", "
62191 | \n", "chr11 | \n", "1004 | \n", "1 | \n", "0.901408 | \n", "{} | \n", "{} | \n", "710 | \n", "1 | \n", "0.589374 | \n", "0.545647 | \n", "0.052450 | \n", "ENSG00000187049 | \n", "ENSG00000149289 | \n", "0.992958 | \n", "0.383099 | \n", "0.029412 | \n", "272 | \n", "
62193 | \n", "chr11 | \n", "1004 | \n", "1 | \n", "0.901408 | \n", "{} | \n", "{} | \n", "710 | \n", "1 | \n", "0.589374 | \n", "0.545647 | \n", "0.052450 | \n", "ENSG00000187049 | \n", "ENSG00000149557 | \n", "0.992958 | \n", "0.681690 | \n", "0.029412 | \n", "272 | \n", "
62194 | \n", "chr11 | \n", "1004 | \n", "1 | \n", "0.901408 | \n", "{} | \n", "{} | \n", "710 | \n", "1 | \n", "0.589374 | \n", "0.545647 | \n", "0.052450 | \n", "ENSG00000187049 | \n", "ENSG00000166086 | \n", "0.992958 | \n", "0.526056 | \n", "0.029412 | \n", "272 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
999978 | \n", "chr11 | \n", "1004 | \n", "1 | \n", "0.901408 | \n", "{} | \n", "{} | \n", "710 | \n", "1 | \n", "0.589374 | \n", "0.545647 | \n", "0.052450 | \n", "ENSG00000162144 | \n", "ENSG00000196371 | \n", "0.964789 | \n", "0.043662 | \n", "0.000000 | \n", "272 | \n", "
999979 | \n", "chr11 | \n", "1004 | \n", "1 | \n", "0.901408 | \n", "{} | \n", "{} | \n", "710 | \n", "1 | \n", "0.589374 | \n", "0.545647 | \n", "0.052450 | \n", "ENSG00000162144 | \n", "ENSG00000137710 | \n", "0.964789 | \n", "0.427465 | \n", "0.000000 | \n", "272 | \n", "
999982 | \n", "chr11 | \n", "1004 | \n", "1 | \n", "0.901408 | \n", "{} | \n", "{} | \n", "710 | \n", "1 | \n", "0.589374 | \n", "0.545647 | \n", "0.052450 | \n", "ENSG00000162144 | \n", "ENSG00000214376 | \n", "0.964789 | \n", "0.036620 | \n", "0.000000 | \n", "272 | \n", "
999985 | \n", "chr11 | \n", "1004 | \n", "1 | \n", "0.940845 | \n", "{} | \n", "{} | \n", "710 | \n", "1 | \n", "0.633611 | \n", "0.578590 | \n", "0.074277 | \n", "ENSG00000162144 | \n", "ENSG00000110218 | \n", "0.964789 | \n", "0.039437 | \n", "0.000000 | \n", "272 | \n", "
999990 | \n", "chr11 | \n", "1004 | \n", "1 | \n", "0.901408 | \n", "{} | \n", "{} | \n", "710 | \n", "1 | \n", "0.589374 | \n", "0.545647 | \n", "0.052450 | \n", "ENSG00000162144 | \n", "ENSG00000064199 | \n", "0.964789 | \n", "0.404225 | \n", "0.000000 | \n", "272 | \n", "
12115 rows × 17 columns
\n", "\n", " | chrm | \n", "num_pairs | \n", "dist_thresh | \n", "auc | \n", "plot | \n", "pr_curve | \n", "true_pos | \n", "true_neg | \n", "exp_median | \n", "exp_mean | \n", "exp_var | \n", "Gene stable ID | \n", "mp_precited | \n", "auc_or | \n", "auc_hic | \n", "p_val | \n", "samples | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
12 | \n", "chr11 | \n", "1004 | \n", "1 | \n", "0.758698 | \n", "{} | \n", "{} | \n", "891 | \n", "1 | \n", "0.121187 | \n", "0.128362 | \n", "0.007605 | \n", "ENSG00000149311 | \n", "ENSG00000244734 | \n", "0.933782 | \n", "0.203143 | \n", "0.425076 | \n", "327 | \n", "
13 | \n", "chr11 | \n", "1004 | \n", "1 | \n", "0.753086 | \n", "{} | \n", "{} | \n", "891 | \n", "1 | \n", "0.181077 | \n", "0.197166 | \n", "0.014144 | \n", "ENSG00000149311 | \n", "ENSG00000188124 | \n", "0.933782 | \n", "0.258137 | \n", "0.425076 | \n", "327 | \n", "
16 | \n", "chr11 | \n", "1004 | \n", "1 | \n", "0.739618 | \n", "{} | \n", "{} | \n", "891 | \n", "1 | \n", "0.575126 | \n", "0.521568 | \n", "0.044223 | \n", "ENSG00000149311 | \n", "ENSG00000149294 | \n", "0.933782 | \n", "0.459035 | \n", "0.425076 | \n", "327 | \n", "
21 | \n", "chr11 | \n", "1004 | \n", "1 | \n", "0.955107 | \n", "{} | \n", "{} | \n", "891 | \n", "1 | \n", "0.709154 | \n", "0.637962 | \n", "0.078983 | \n", "ENSG00000149311 | \n", "ENSG00000149089 | \n", "0.933782 | \n", "0.158249 | \n", "0.425076 | \n", "327 | \n", "
25 | \n", "chr11 | \n", "1004 | \n", "1 | \n", "0.976431 | \n", "{} | \n", "{} | \n", "891 | \n", "1 | \n", "0.623800 | \n", "0.579748 | \n", "0.052413 | \n", "ENSG00000149311 | \n", "ENSG00000179532 | \n", "0.933782 | \n", "0.355780 | \n", "0.425076 | \n", "327 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
1006993 | \n", "chr11 | \n", "1004 | \n", "1 | \n", "0.828671 | \n", "{} | \n", "{} | \n", "858 | \n", "1 | \n", "0.590600 | \n", "0.544989 | \n", "0.049380 | \n", "ENSG00000064199 | \n", "ENSG00000171202 | \n", "0.828671 | \n", "0.444639 | \n", "1.000000 | \n", "356 | \n", "
1006996 | \n", "chr11 | \n", "1004 | \n", "1 | \n", "0.828671 | \n", "{} | \n", "{} | \n", "858 | \n", "1 | \n", "0.590600 | \n", "0.544989 | \n", "0.049380 | \n", "ENSG00000064199 | \n", "ENSG00000183801 | \n", "0.828671 | \n", "0.414918 | \n", "1.000000 | \n", "356 | \n", "
1007003 | \n", "chr11 | \n", "1004 | \n", "1 | \n", "0.828671 | \n", "{} | \n", "{} | \n", "858 | \n", "1 | \n", "0.590600 | \n", "0.544989 | \n", "0.049380 | \n", "ENSG00000064199 | \n", "ENSG00000214376 | \n", "0.828671 | \n", "0.635781 | \n", "1.000000 | \n", "356 | \n", "
1007007 | \n", "chr11 | \n", "1004 | \n", "1 | \n", "0.828671 | \n", "{} | \n", "{} | \n", "858 | \n", "1 | \n", "0.590600 | \n", "0.544989 | \n", "0.049380 | \n", "ENSG00000064199 | \n", "ENSG00000110218 | \n", "0.828671 | \n", "0.329837 | \n", "1.000000 | \n", "356 | \n", "
1007008 | \n", "chr11 | \n", "1004 | \n", "1 | \n", "0.828671 | \n", "{} | \n", "{} | \n", "858 | \n", "1 | \n", "0.590600 | \n", "0.544989 | \n", "0.049380 | \n", "ENSG00000064199 | \n", "ENSG00000196778 | \n", "0.828671 | \n", "0.314685 | \n", "1.000000 | \n", "356 | \n", "
297125 rows × 17 columns
\n", "\n", " | chrm | \n", "variable | \n", "value | \n", "
---|---|---|---|
0 | \n", "chr11 | \n", "auc | \n", "0.758698 | \n", "
1 | \n", "chr11 | \n", "auc | \n", "0.753086 | \n", "
2 | \n", "chr11 | \n", "auc | \n", "0.739618 | \n", "
3 | \n", "chr11 | \n", "auc | \n", "0.955107 | \n", "
4 | \n", "chr11 | \n", "auc | \n", "0.976431 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "
536191 | \n", "chr11 | \n", "auc_or | \n", "0.828671 | \n", "
536192 | \n", "chr11 | \n", "auc_or | \n", "0.828671 | \n", "
536193 | \n", "chr11 | \n", "auc_or | \n", "0.828671 | \n", "
536194 | \n", "chr11 | \n", "auc_or | \n", "0.828671 | \n", "
536195 | \n", "chr11 | \n", "auc_or | \n", "0.828671 | \n", "
536196 rows × 3 columns
\n", "