{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
CategoryCountGC content
EnzymeImProm-II 42CImProm-II 55CSuperScriptIVTGIRTImProm-II 42CImProm-II 55CSuperScriptIVTGIRT
Low abundance2882392302110.5000000.5000000.5000000.500000
Verrucomicrobiae1310620139110290.5344860.5333330.5323150.532096
Unclassified12111210129212160.4927660.5077560.5052670.503933
Alphaproteobacteria12943930212148123850.5548350.5534260.5626060.563610
Deltaproteobacteria43302154314130010.5639300.5660200.5652180.565658
Gammaproteobacteria59677610279325760.5430560.5368290.5442280.545745
Planctomycetacia3577102472830.5982060.6247580.6071470.619704
Phycisphaerae10112818170.5765350.5731420.5727570.577386
Saccharimonadia1305749300.5030400.5017560.4960030.496590
Longimicrobia3282172131970.6151910.6160980.6153480.614556
Gemmatimonadetes5325915184630.6260240.6290100.6260450.628619
BD2-11263348420.6098610.6102530.6088900.610935
S013411675731140.5891860.6030750.5995250.598523
Nitrospira323474700.6007360.5995530.5995220.599818
Bacilli13566566635200.5228740.5337930.5312690.537584
Fibrobacteria453546360.5544490.5548410.5538320.553822
Entotheonellia1251222211640.5767940.5766640.5762620.575045
Deinococci892844290.5653570.5742200.5613800.564073
Oxyphotobacteria279896217118770.5460750.5447380.5460600.545485
Chloroflexia4418256667890.6391460.6447710.6396640.640914
Anaerolineae191175113890.5523750.5594230.5612380.564171
Gitt-GS-1362701712392740.5609480.5618900.5610700.560207
JG30-KF-CM66761451751750.5967720.5974730.5970700.597318
KD4-962982643704060.5696510.5693400.5692420.568869
TK102755835226110.6148150.6286710.6184170.616980
Ktedonobacteria264161520.5786460.5789460.5805070.580245
Dehalococcoidia7098155970.5781480.5778600.5775430.578580
Bacteroidia28251817230730050.5143520.5143830.5137380.508924
Fimbriimonadia692932430.5424530.5433260.5368590.541226
uncultured416631280.6087570.6126510.6111160.616270
Actinobacteria58641126310105113530.5833210.5838050.5847250.586320
Acidimicrobiia12031617151818580.5852210.5866620.5881910.587488
Thermoleophilia27454643373335620.5890960.5889530.5894920.589915
0319-7L145274423323920.5807500.5829870.5812330.582942
Nitriliruptoria2533804104080.5765690.5786540.5768600.577517
Rubrobacteria13511505238019740.5976080.6003720.6010170.601583
MB-A2-1086110167990.6089170.6085270.6082360.605956
Thermoanaerobaculia1171271221460.5822420.5828200.5830030.582521
Subgroup3852846815010.5801260.5806210.5797170.580671
Holophagae2351393081910.5672140.5666780.5680340.568013
Blastocatellia3362433093280.5435840.5464200.5481640.549827
Acidobacteriia2572594443590.5557910.5617080.5618130.559804
\n", "
" ], "text/plain": [ "Category Count \\\n", "Enzyme ImProm-II 42C ImProm-II 55C SuperScriptIV TGIRT \n", "Low abundance 288 239 230 211 \n", "Verrucomicrobiae 1310 620 1391 1029 \n", "Unclassified 1211 1210 1292 1216 \n", "Alphaproteobacteria 12943 9302 12148 12385 \n", "Deltaproteobacteria 4330 2154 3141 3001 \n", "Gammaproteobacteria 5967 7610 2793 2576 \n", "Planctomycetacia 357 710 247 283 \n", "Phycisphaerae 101 128 18 17 \n", "Saccharimonadia 130 57 49 30 \n", "Longimicrobia 328 217 213 197 \n", "Gemmatimonadetes 532 591 518 463 \n", "BD2-11 26 33 48 42 \n", "S0134 116 75 73 114 \n", "Nitrospira 32 34 74 70 \n", "Bacilli 1356 656 663 520 \n", "Fibrobacteria 45 35 46 36 \n", "Entotheonellia 125 122 221 164 \n", "Deinococci 89 28 44 29 \n", "Oxyphotobacteria 2798 962 1711 877 \n", "Chloroflexia 441 825 666 789 \n", "Anaerolineae 191 175 113 89 \n", "Gitt-GS-136 270 171 239 274 \n", "JG30-KF-CM66 76 145 175 175 \n", "KD4-96 298 264 370 406 \n", "TK10 275 583 522 611 \n", "Ktedonobacteria 26 41 61 52 \n", "Dehalococcoidia 70 98 155 97 \n", "Bacteroidia 2825 1817 2307 3005 \n", "Fimbriimonadia 69 29 32 43 \n", "uncultured 41 66 31 28 \n", "Actinobacteria 5864 11263 10105 11353 \n", "Acidimicrobiia 1203 1617 1518 1858 \n", "Thermoleophilia 2745 4643 3733 3562 \n", "0319-7L14 527 442 332 392 \n", "Nitriliruptoria 253 380 410 408 \n", "Rubrobacteria 1351 1505 2380 1974 \n", "MB-A2-108 61 101 67 99 \n", "Thermoanaerobaculia 117 127 122 146 \n", "Subgroup 385 284 681 501 \n", "Holophagae 235 139 308 191 \n", "Blastocatellia 336 243 309 328 \n", "Acidobacteriia 257 259 444 359 \n", "\n", "Category GC content \n", "Enzyme ImProm-II 42C ImProm-II 55C SuperScriptIV TGIRT \n", "Low abundance 0.500000 0.500000 0.500000 0.500000 \n", "Verrucomicrobiae 0.534486 0.533333 0.532315 0.532096 \n", "Unclassified 0.492766 0.507756 0.505267 0.503933 \n", "Alphaproteobacteria 0.554835 0.553426 0.562606 0.563610 \n", "Deltaproteobacteria 0.563930 0.566020 0.565218 0.565658 \n", 
"Gammaproteobacteria 0.543056 0.536829 0.544228 0.545745 \n", "Planctomycetacia 0.598206 0.624758 0.607147 0.619704 \n", "Phycisphaerae 0.576535 0.573142 0.572757 0.577386 \n", "Saccharimonadia 0.503040 0.501756 0.496003 0.496590 \n", "Longimicrobia 0.615191 0.616098 0.615348 0.614556 \n", "Gemmatimonadetes 0.626024 0.629010 0.626045 0.628619 \n", "BD2-11 0.609861 0.610253 0.608890 0.610935 \n", "S0134 0.589186 0.603075 0.599525 0.598523 \n", "Nitrospira 0.600736 0.599553 0.599522 0.599818 \n", "Bacilli 0.522874 0.533793 0.531269 0.537584 \n", "Fibrobacteria 0.554449 0.554841 0.553832 0.553822 \n", "Entotheonellia 0.576794 0.576664 0.576262 0.575045 \n", "Deinococci 0.565357 0.574220 0.561380 0.564073 \n", "Oxyphotobacteria 0.546075 0.544738 0.546060 0.545485 \n", "Chloroflexia 0.639146 0.644771 0.639664 0.640914 \n", "Anaerolineae 0.552375 0.559423 0.561238 0.564171 \n", "Gitt-GS-136 0.560948 0.561890 0.561070 0.560207 \n", "JG30-KF-CM66 0.596772 0.597473 0.597070 0.597318 \n", "KD4-96 0.569651 0.569340 0.569242 0.568869 \n", "TK10 0.614815 0.628671 0.618417 0.616980 \n", "Ktedonobacteria 0.578646 0.578946 0.580507 0.580245 \n", "Dehalococcoidia 0.578148 0.577860 0.577543 0.578580 \n", "Bacteroidia 0.514352 0.514383 0.513738 0.508924 \n", "Fimbriimonadia 0.542453 0.543326 0.536859 0.541226 \n", "uncultured 0.608757 0.612651 0.611116 0.616270 \n", "Actinobacteria 0.583321 0.583805 0.584725 0.586320 \n", "Acidimicrobiia 0.585221 0.586662 0.588191 0.587488 \n", "Thermoleophilia 0.589096 0.588953 0.589492 0.589915 \n", "0319-7L14 0.580750 0.582987 0.581233 0.582942 \n", "Nitriliruptoria 0.576569 0.578654 0.576860 0.577517 \n", "Rubrobacteria 0.597608 0.600372 0.601017 0.601583 \n", "MB-A2-108 0.608917 0.608527 0.608236 0.605956 \n", "Thermoanaerobaculia 0.582242 0.582820 0.583003 0.582521 \n", "Subgroup 0.580126 0.580621 0.579717 0.580671 \n", "Holophagae 0.567214 0.566678 0.568034 0.568013 \n", "Blastocatellia 0.543584 0.546420 0.548164 0.549827 \n", "Acidobacteriia 
# %%
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
from matplotlib import cm

# %%
# The two header rows of the CSV become a (Category, Enzyme) column MultiIndex
# and the first column becomes the row index.
df1 = pd.read_csv("GC_class_forFigure_ordered.csv", header=[0, 1], index_col=0)
df1.columns.names = ["Category", "Enzyme"]
df1

# %% [markdown]
# Labels of the pairwise comparisons computed below. In the code, the
# "Promega42" / "Promega55" labels are paired with the "ImProm-II 42C" /
# "ImProm-II 55C" count columns.
#
# |Enzyme        |TGIRT  |SuperScriptIV|Promega42  |Promega55|
# |:-------------|:-----:|:-----------:|:---------:|:-------:|
# |TGIRT         | x     | TvS         | Tv42      | Tv55    |
# |SuperScriptIV | TvS   | x           | Sv42      | Sv55    |
# |Promega42     | Tv42  | Sv42        | x         | P42v55  |
# |Promega55     | Tv55  | Sv55        | P42v55    | x       |

# %%
def relativeEnrichment(a, b):
    """Return the normalised difference ``(a - b) / (a + b)``.

    The result is positive where ``a`` exceeds ``b`` and negative where ``b``
    exceeds ``a``; for non-negative inputs it lies in ``[-1, 1]``.

    Parameters
    ----------
    a, b : scalar, numpy array or pandas.Series
        Values to compare. Array-like inputs are combined element-wise
        (pandas aligns Series on their index).

    Returns
    -------
    Same kind as the inputs. Where ``a + b`` is zero the result is NaN
    (``a - b`` also zero) or +/-inf; plain Python scalars follow the same
    convention instead of raising ``ZeroDivisionError``.
    """
    difference = a - b
    total = a + b
    try:
        return difference / total
    except ZeroDivisionError:
        # Only plain Python numbers raise here; numpy/pandas already return
        # NaN or inf for a zero denominator, so mirror that behaviour.
        if difference == 0:
            return float("nan")
        return float("inf") if difference > 0 else float("-inf")

# %%
idx = pd.IndexSlice

# (comparison label, enzyme a, enzyme b): every label becomes the column
# ("Comparison", label) holding relativeEnrichment(Count[a], Count[b]).
COMPARISONS = [
    ("TvS", "TGIRT", "SuperScriptIV"),
    ("Tv42", "TGIRT", "ImProm-II 42C"),
    ("Tv55", "TGIRT", "ImProm-II 55C"),
    ("Sv42", "SuperScriptIV", "ImProm-II 42C"),
    ("Sv55", "SuperScriptIV", "ImProm-II 55C"),
    ("P42v55", "ImProm-II 42C", "ImProm-II 55C"),
]

enrichment = {}
for label, enzyme_a, enzyme_b in COMPARISONS:
    enrichment[label] = relativeEnrichment(
        df1.loc[:, idx["Count", enzyme_a]],
        df1.loc[:, idx["Count", enzyme_b]],
    )
    df1["Comparison", label] = enrichment[label]

# Keep the module-level names that the original cell defined.
TvS, Tv42, Tv55, Sv42, Sv55, P42v55 = (
    enrichment[label] for label, _, _ in COMPARISONS
)

# %%
default_dpi = plt.rcParamsDefault["figure.dpi"]
plt.rcParams["figure.figsize"] = [6, 8]


def barplotFigure(y, GC_content, name, xlim=(-0.8, 0.8)):
    """Draw a horizontal bar chart coloured by GC content and save it as PDF.

    The current pyplot figure is cleared and reused, so after several calls
    only the most recent chart remains in the figure; every chart is written
    to its own file.

    Parameters
    ----------
    y : pandas.Series or array-like
        Bar lengths, one bar per entry. When ``y`` is a Series its index
        supplies the tick labels; otherwise the bar positions are used.
    GC_content : pandas.Series or array-like
        One value per bar; mapped onto the viridis colormap after rescaling
        so that the smallest value maps to 0 and the largest to 1.
    name : str
        Figure title and file stem: the chart is saved as ``name + ".pdf"``
        relative to the current working directory.
    xlim : pair of float, optional
        Limits of the x axis. Defaults to ``(-0.8, 0.8)``.
    """
    bar_values = np.asarray(y, dtype=float)
    gc_values = np.asarray(GC_content, dtype=float)

    # Bar positions and their labels. Labels are taken from the data that is
    # plotted rather than from a notebook-level DataFrame.
    x_pos = np.arange(len(bar_values))
    labels = y.index.values if isinstance(y, pd.Series) else x_pos

    # Stretch the colour values over the full 0..1 range of the colormap.
    gc_min, gc_max = gc_values.min(), gc_values.max()
    gc_span = gc_max - gc_min
    if gc_span > 0:
        col_norm = (gc_values - gc_min) / gc_span
    else:
        # All values equal: avoid 0/0 and use a single colour.
        col_norm = np.zeros_like(gc_values)
    colors = cm.viridis(col_norm)

    fig = plt.gcf()
    fig.clf()
    ax = fig.add_subplot(111)

    # Colorbar legend in original GC units. A stand-alone ScalarMappable is
    # used instead of a throw-away scatter plot, and the parent Axes is given
    # explicitly so Matplotlib does not have to guess where to put the bar.
    legend = cm.ScalarMappable(
        norm=plt.Normalize(vmin=gc_min, vmax=gc_max), cmap=cm.viridis
    )
    legend.set_array(gc_values)  # older Matplotlib needs an array before colorbar()
    fig.colorbar(legend, ax=ax)

    ax.barh(x_pos, bar_values, color=colors, align="center")
    ax.set_yticks(x_pos)
    ax.set_yticklabels(labels)
    ax.set_title(name)
    ax.set_xlim(xlim)

    fig.savefig(name + ".pdf", bbox_inches="tight")

# %%
# (figure title / file stem, comparison column, enzyme whose GC content colours the bars)
# NOTE(review): each figure is coloured by the GC content of only one of the
# two enzymes being compared; the choice is kept exactly as it was - confirm
# it is intended.
# NOTE(review): the titles double as file names, so the trailing spaces and
# the ":" / "°" characters end up in the PDF file names.
FIGURES = [
    ("SuperScriptIV : TGIRT ", "TvS", "TGIRT"),
    ("ImProm-II 42°C : TGIRT ", "Tv42", "ImProm-II 42C"),
    ("ImProm-II 55°C : TGIRT ", "Tv55", "ImProm-II 55C"),
    ("ImProm-II 42°C : SuperScriptIV ", "Sv42", "ImProm-II 42C"),
    ("ImProm-II 55°C : SuperScriptIV ", "Sv55", "ImProm-II 55C"),
    ("ImProm-II 55°C : ImProm-II 42°C", "P42v55", "ImProm-II 42C"),
]

for name, comparison, gc_enzyme in FIGURES:
    barplotFigure(
        y=df1["Comparison", comparison],
        GC_content=df1["GC content", gc_enzyme],
        name=name,
    )