{ "cells": [ { "cell_type": "code", "execution_count": 27, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
CategoryAverageStdDevGC content
EnzymeImProm-II 42CImProm-II 55CSuperScriptIVTGIRTImProm-II 42CImProm-II 55CSuperScriptIVTGIRTImProm-II 42CImProm-II 55CSuperScriptIVTGIRT
Low abundance28823923021168.92516552.14258935.39258232.7022590.5000000.5000000.5000000.500000
Verrucomicrobiae13106201391102984.88227143.312816112.83926649.7262510.5344860.5333330.5323150.532096
Unclassified121112101292121640.94752721.50581333.32866640.1335270.4927660.5077560.5052670.503933
Alphaproteobacteria1294393021214812385481.747652232.488279303.496787382.1884350.5548350.5534260.5626060.563610
Deltaproteobacteria4330215431413001440.766945215.61238478.34985648.8640970.5639300.5660200.5652180.565658
Gammaproteobacteria5967761027932576556.201672552.65359980.198504162.0808440.5430560.5368290.5442280.545745
Planctomycetacia35771024728320.32978150.90677816.57709316.5317880.5982060.6247580.6071470.619704
Phycisphaerae10112818175.63027511.0589333.0495901.3416410.5765350.5731420.5727570.577386
Saccharimonadia13057493019.7989904.39317716.4529639.1104340.5030400.5017560.4960030.496590
Longimicrobia32821721319736.95673112.19836125.51078219.1650720.6151910.6160980.6153480.614556
Gemmatimonadetes532591518463111.57643177.212046105.991981106.9242720.6260240.6290100.6260450.628619
BD2-11263348425.7619447.9874908.8204316.7305270.6098610.6102530.6088900.610935
S0134116757311432.64506113.61983818.79627630.6545270.5891860.6030750.5995250.598523
Nitrospira323474704.0373263.7682899.8081608.6890740.6007360.5995530.5995220.599818
Bacilli1356656663520133.78415560.87035474.75158965.0768780.5228740.5337930.5312690.537584
Fibrobacteria453546363.0000003.0822072.4899802.9495760.5544490.5548410.5538320.553822
Entotheonellia12512222116423.43074922.07487334.62946723.4882950.5767940.5766640.5762620.575045
Deinococci8928442919.9173292.9664794.1472883.9623230.5653570.5742200.5613800.564073
Oxyphotobacteria27989621711877523.532520243.335776212.430459139.2634190.5460750.5447380.5460600.545485
Chloroflexia44182566678939.23263912.38951233.71498233.7298090.6391460.6447710.6396640.640914
Anaerolineae191175113897.5630688.09320712.7003945.8051700.5523750.5594230.5612380.564171
Gitt-GS-13627017123927432.89376825.67489016.51363114.8727940.5609480.5618900.5610700.560207
JG30-KF-CM667614517517511.27829814.35270012.8452337.2456880.5967720.5974730.5970700.597318
KD4-9629826437040621.17309612.19426135.68613226.4707390.5696510.5693400.5692420.568869
TK1027558352261125.95187945.97064338.44866743.8884950.6148150.6286710.6184170.616980
Ktedonobacteria264161523.5637064.4384684.0865635.3197740.5786460.5789460.5805070.580245
Dehalococcoidia7098155975.87367011.10405314.5258399.4762860.5781480.5778600.5775430.578580
Bacteroidia2825181723073005141.663333188.279845143.224649194.8037470.5143520.5143830.5137380.508924
Fimbriimonadia692932437.5960523.8340584.0987803.6469170.5424530.5433260.5368590.541226
uncultured416631284.4384683.4205261.9235382.7018510.6087570.6126510.6111160.616270
Acidobacteriia25725944435929.3649456.94262218.08867028.4552280.5557910.5617080.5618130.559804
Acidimicrobiia1203161715181858109.91724247.30010646.30118855.4102880.5852210.5866620.5881910.587488
Thermoleophilia2745464337333562254.825430135.417133190.525064174.3166660.5890960.5889530.5894920.589915
0319-7L1452744233239285.20739481.04196450.25733856.3897150.5807500.5829870.5812330.582942
Nitriliruptoria25338041040817.84096414.74788112.4096744.5607020.5765690.5786540.5768600.577517
Rubrobacteria135115052380197467.31047571.333723193.530359158.6764000.5976080.6003720.6010170.601583
MB-A2-10861101679914.75466018.6868943.4351134.1472880.6089170.6085270.6082360.605956
Thermoanaerobaculia11712712214611.43678310.28591311.56719516.2696040.5822420.5828200.5830030.582521
Subgroup38528468150151.20058637.03646944.54997242.7106540.5801260.5806210.5797170.580671
Holophagae23513930819125.41653014.30734112.09545436.8334090.5672140.5666780.5680340.568013
Blastocatellia33624330932831.54679114.87615533.89985336.9296630.5435840.5464200.5481640.549827
Actinobacteria5864112631010511353445.351771581.639321223.156895274.2969190.5833210.5838050.5847250.586320
\n", "
" ], "text/plain": [ "Category Average \\\n", "Enzyme ImProm-II 42C ImProm-II 55C SuperScriptIV TGIRT \n", "Low abundance 288 239 230 211 \n", "Verrucomicrobiae 1310 620 1391 1029 \n", "Unclassified 1211 1210 1292 1216 \n", "Alphaproteobacteria 12943 9302 12148 12385 \n", "Deltaproteobacteria 4330 2154 3141 3001 \n", "Gammaproteobacteria 5967 7610 2793 2576 \n", "Planctomycetacia 357 710 247 283 \n", "Phycisphaerae 101 128 18 17 \n", "Saccharimonadia 130 57 49 30 \n", "Longimicrobia 328 217 213 197 \n", "Gemmatimonadetes 532 591 518 463 \n", "BD2-11 26 33 48 42 \n", "S0134 116 75 73 114 \n", "Nitrospira 32 34 74 70 \n", "Bacilli 1356 656 663 520 \n", "Fibrobacteria 45 35 46 36 \n", "Entotheonellia 125 122 221 164 \n", "Deinococci 89 28 44 29 \n", "Oxyphotobacteria 2798 962 1711 877 \n", "Chloroflexia 441 825 666 789 \n", "Anaerolineae 191 175 113 89 \n", "Gitt-GS-136 270 171 239 274 \n", "JG30-KF-CM66 76 145 175 175 \n", "KD4-96 298 264 370 406 \n", "TK10 275 583 522 611 \n", "Ktedonobacteria 26 41 61 52 \n", "Dehalococcoidia 70 98 155 97 \n", "Bacteroidia 2825 1817 2307 3005 \n", "Fimbriimonadia 69 29 32 43 \n", "uncultured 41 66 31 28 \n", "Acidobacteriia 257 259 444 359 \n", "Acidimicrobiia 1203 1617 1518 1858 \n", "Thermoleophilia 2745 4643 3733 3562 \n", "0319-7L14 527 442 332 392 \n", "Nitriliruptoria 253 380 410 408 \n", "Rubrobacteria 1351 1505 2380 1974 \n", "MB-A2-108 61 101 67 99 \n", "Thermoanaerobaculia 117 127 122 146 \n", "Subgroup 385 284 681 501 \n", "Holophagae 235 139 308 191 \n", "Blastocatellia 336 243 309 328 \n", "Actinobacteria 5864 11263 10105 11353 \n", "\n", "Category StdDev \\\n", "Enzyme ImProm-II 42C ImProm-II 55C SuperScriptIV TGIRT \n", "Low abundance 68.925165 52.142589 35.392582 32.702259 \n", "Verrucomicrobiae 84.882271 43.312816 112.839266 49.726251 \n", "Unclassified 40.947527 21.505813 33.328666 40.133527 \n", "Alphaproteobacteria 481.747652 232.488279 303.496787 382.188435 \n", "Deltaproteobacteria 440.766945 215.612384 78.349856 48.864097 \n", "Gammaproteobacteria 556.201672 552.653599 80.198504 162.080844 \n", "Planctomycetacia 20.329781 50.906778 16.577093 16.531788 \n", "Phycisphaerae 5.630275 11.058933 3.049590 1.341641 \n", "Saccharimonadia 19.798990 4.393177 16.452963 9.110434 \n", "Longimicrobia 36.956731 12.198361 25.510782 19.165072 \n", "Gemmatimonadetes 111.576431 77.212046 105.991981 106.924272 \n", "BD2-11 5.761944 7.987490 8.820431 6.730527 \n", "S0134 32.645061 13.619838 18.796276 30.654527 \n", "Nitrospira 4.037326 3.768289 9.808160 8.689074 \n", "Bacilli 133.784155 60.870354 74.751589 65.076878 \n", "Fibrobacteria 3.000000 3.082207 2.489980 2.949576 \n", "Entotheonellia 23.430749 22.074873 34.629467 23.488295 \n", "Deinococci 19.917329 2.966479 4.147288 3.962323 \n", "Oxyphotobacteria 523.532520 243.335776 212.430459 139.263419 \n", "Chloroflexia 39.232639 12.389512 33.714982 33.729809 \n", "Anaerolineae 7.563068 8.093207 12.700394 5.805170 \n", "Gitt-GS-136 32.893768 25.674890 16.513631 14.872794 \n", "JG30-KF-CM66 11.278298 14.352700 12.845233 7.245688 \n", "KD4-96 21.173096 12.194261 35.686132 26.470739 \n", "TK10 25.951879 45.970643 38.448667 43.888495 \n", "Ktedonobacteria 3.563706 4.438468 4.086563 5.319774 \n", "Dehalococcoidia 5.873670 11.104053 14.525839 9.476286 \n", "Bacteroidia 141.663333 188.279845 143.224649 194.803747 \n", "Fimbriimonadia 7.596052 3.834058 4.098780 3.646917 \n", "uncultured 4.438468 3.420526 1.923538 2.701851 \n", "Acidobacteriia 29.364945 6.942622 18.088670 28.455228 \n", "Acidimicrobiia 109.917242 47.300106 46.301188 55.410288 \n", "Thermoleophilia 254.825430 135.417133 190.525064 174.316666 \n", "0319-7L14 85.207394 81.041964 50.257338 56.389715 \n", "Nitriliruptoria 17.840964 14.747881 12.409674 4.560702 \n", "Rubrobacteria 67.310475 71.333723 193.530359 158.676400 \n", "MB-A2-108 14.754660 18.686894 3.435113 4.147288 \n", "Thermoanaerobaculia 11.436783 10.285913 11.567195 16.269604 \n", "Subgroup 51.200586 37.036469 44.549972 42.710654 \n", "Holophagae 25.416530 14.307341 12.095454 36.833409 \n", "Blastocatellia 31.546791 14.876155 33.899853 36.929663 \n", "Actinobacteria 445.351771 581.639321 223.156895 274.296919 \n", "\n", "Category GC content \n", "Enzyme ImProm-II 42C ImProm-II 55C SuperScriptIV TGIRT \n", "Low abundance 0.500000 0.500000 0.500000 0.500000 \n", "Verrucomicrobiae 0.534486 0.533333 0.532315 0.532096 \n", "Unclassified 0.492766 0.507756 0.505267 0.503933 \n", "Alphaproteobacteria 0.554835 0.553426 0.562606 0.563610 \n", "Deltaproteobacteria 0.563930 0.566020 0.565218 0.565658 \n", "Gammaproteobacteria 0.543056 0.536829 0.544228 0.545745 \n", "Planctomycetacia 0.598206 0.624758 0.607147 0.619704 \n", "Phycisphaerae 0.576535 0.573142 0.572757 0.577386 \n", "Saccharimonadia 0.503040 0.501756 0.496003 0.496590 \n", "Longimicrobia 0.615191 0.616098 0.615348 0.614556 \n", "Gemmatimonadetes 0.626024 0.629010 0.626045 0.628619 \n", "BD2-11 0.609861 0.610253 0.608890 0.610935 \n", "S0134 0.589186 0.603075 0.599525 0.598523 \n", "Nitrospira 0.600736 0.599553 0.599522 0.599818 \n", "Bacilli 0.522874 0.533793 0.531269 0.537584 \n", "Fibrobacteria 0.554449 0.554841 0.553832 0.553822 \n", "Entotheonellia 0.576794 0.576664 0.576262 0.575045 \n", "Deinococci 0.565357 0.574220 0.561380 0.564073 \n", "Oxyphotobacteria 0.546075 0.544738 0.546060 0.545485 \n", "Chloroflexia 0.639146 0.644771 0.639664 0.640914 \n", "Anaerolineae 0.552375 0.559423 0.561238 0.564171 \n", "Gitt-GS-136 0.560948 0.561890 0.561070 0.560207 \n", "JG30-KF-CM66 0.596772 0.597473 0.597070 0.597318 \n", "KD4-96 0.569651 0.569340 0.569242 0.568869 \n", "TK10 0.614815 0.628671 0.618417 0.616980 \n", "Ktedonobacteria 0.578646 0.578946 0.580507 0.580245 \n", "Dehalococcoidia 0.578148 0.577860 0.577543 0.578580 \n", "Bacteroidia 0.514352 0.514383 0.513738 0.508924 \n", "Fimbriimonadia 0.542453 0.543326 0.536859 0.541226 \n", "uncultured 0.608757 0.612651 0.611116 0.616270 \n", "Acidobacteriia 0.555791 0.561708 0.561813 0.559804 \n", "Acidimicrobiia 0.585221 0.586662 0.588191 0.587488 \n", "Thermoleophilia 0.589096 0.588953 0.589492 0.589915 \n", "0319-7L14 0.580750 0.582987 0.581233 0.582942 \n", "Nitriliruptoria 0.576569 0.578654 0.576860 0.577517 \n", "Rubrobacteria 0.597608 0.600372 0.601017 0.601583 \n", "MB-A2-108 0.608917 0.608527 0.608236 0.605956 \n", "Thermoanaerobaculia 0.582242 0.582820 0.583003 0.582521 \n", "Subgroup 0.580126 0.580621 0.579717 0.580671 \n", "Holophagae 0.567214 0.566678 0.568034 0.568013 \n", "Blastocatellia 0.543584 0.546420 0.548164 0.549827 \n", "Actinobacteria 0.583321 0.583805 0.584725 0.586320 " ] }, "execution_count": 27, "metadata": {}, "output_type": "execute_result" } ], "source": [ "import pandas as pd\n", "import math\n", "\n", "df1 = pd.read_csv(\"GC_class_forFigure_ordered.csv\", header=[0,1], index_col=0)\n", "df1.columns.names = [\"Category\", \"Enzyme\"]\n", "df1" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "|Enzyme |TGIRT |SuperScriptIV|Promega42 |Promega55|\n", "|:-------------|:-----:|:-----------:|:---------:|:-------:|\n", "|TGIRT | x | TvS | Tv42 | Tv55 | \n", "|SuperScriptIV | TvS | x | Sv42 | Sv55 |\n", "|Promega42 | Tv42 | Sv42 | x | P42v55 |\n", "|Promega55 | Tv55 | Sv55 | P42v55 | x |" ] }, { "cell_type": "code", "execution_count": 41, "metadata": {}, "outputs": [], "source": [ "def relativeEnrichment(x, y, stdDevX, stdDevY):\n", " valueVect = []\n", " errorVect = []\n", " \n", " for a, b, stdDevA, stdDevB in zip(x, y, stdDevX, stdDevY):\n", " value = (a-b)/(a+b)\n", " \n", " ab_1 = 2/(math.pow((a+b), 2))\n", " ab_2 = math.sqrt(math.pow(b,2)*math.pow(stdDevA,2) + math.pow(a,2)*math.pow(stdDevB,2))\n", " error = ab_1*ab_2\n", " \n", " valueVect.append(value)\n", " errorVect.append(math.fabs(error))\n", " \n", " return valueVect, errorVect" ] }, { "cell_type": "code", "execution_count": 42, "metadata": {}, "outputs": [], "source": [ "idx = pd.IndexSlice\n", "\n", "TvS, TvSerror = relativeEnrichment(df1.loc[:, idx[\"Average\", \"TGIRT\"]],\n", " df1.loc[:, idx[\"Average\", \"SuperScriptIV\"]],\n", " df1.loc[:, idx[\"StdDev\", \"TGIRT\"]],\n", " df1.loc[:, idx[\"StdDev\", \"SuperScriptIV\"]])\n", "df1[\"Comparison\", \"TvS\"] = TvS\n", "df1[\"Comparison\", \"TvSerror\"] = TvSerror\n", "\n", "Tv42, Tv42error = relativeEnrichment(df1.loc[:, idx[\"Average\", \"TGIRT\"]],\n", " df1.loc[:, idx[\"Average\", \"ImProm-II 42C\"]],\n", " df1.loc[:, idx[\"StdDev\", \"TGIRT\"]],\n", " df1.loc[:, idx[\"StdDev\", \"ImProm-II 42C\"]])\n", "df1[\"Comparison\", \"Tv42\"] = Tv42\n", "df1[\"Comparison\", \"Tv42error\"] = Tv42error\n", "\n", "Tv55, Tv55error = relativeEnrichment(df1.loc[:, idx[\"Average\", \"TGIRT\"]],\n", " df1.loc[:, idx[\"Average\", \"ImProm-II 55C\"]],\n", " df1.loc[:, idx[\"StdDev\", \"TGIRT\"]],\n", " df1.loc[:, idx[\"StdDev\", \"ImProm-II 55C\"]])\n", "df1[\"Comparison\", \"Tv55\"] = Tv55\n", "df1[\"Comparison\", \"Tv55error\"] = Tv55error\n", "\n", "Sv42, Sv42error = relativeEnrichment(df1.loc[:, idx[\"Average\", \"SuperScriptIV\"]],\n", " df1.loc[:, idx[\"Average\", \"ImProm-II 42C\"]],\n", " df1.loc[:, idx[\"StdDev\", \"SuperScriptIV\"]],\n", " df1.loc[:, idx[\"StdDev\", \"ImProm-II 42C\"]])\n", "df1[\"Comparison\", \"Sv42\"] = Sv42\n", "df1[\"Comparison\", \"Sv42error\"] = Sv42error\n", "\n", "Sv55, Sv55error = relativeEnrichment(df1.loc[:, idx[\"Average\", \"SuperScriptIV\"]], \n", " df1.loc[:, idx[\"Average\", \"ImProm-II 55C\"]],\n", " df1.loc[:, idx[\"StdDev\", \"SuperScriptIV\"]], \n", " df1.loc[:, idx[\"StdDev\", \"ImProm-II 55C\"]])\n", "df1[\"Comparison\", \"Sv55\"] = Sv55\n", "df1[\"Comparison\", \"Sv55error\"] = Sv55error\n", "\n", "P42v55, P42v55error = relativeEnrichment(df1.loc[:, idx[\"Average\", \"ImProm-II 42C\"]],\n", " df1.loc[:, idx[\"Average\", \"ImProm-II 55C\"]],\n", " df1.loc[:, idx[\"StdDev\", \"ImProm-II 42C\"]],\n", " df1.loc[:, idx[\"StdDev\", \"ImProm-II 55C\"]])\n", "df1[\"Comparison\", \"P42v55\"] = P42v55\n", "df1[\"Comparison\", \"P42v55error\"] = P42v55error" ] }, { "cell_type": "code", "execution_count": 43, "metadata": {}, "outputs": [], "source": [ "import matplotlib.pyplot as plt\n", "from matplotlib import cm\n", "import numpy as np\n", "\n", "default_dpi = plt.rcParamsDefault[\"figure.dpi\"]\n", "plt.rcParams[\"figure.figsize\"] = [6,8]\n", "\n", "def barplotFigure(y, y_stdDev, GC_content, name):\n", " # Bar position\n", " x_pos = np.arange(len(y))\n", " # \"Stretching\" color values betwenn 0 and 1 to get the best colourfulness\n", " col_norm =(GC_content-min(GC_content))/(max(GC_content-min(GC_content)))\n", " # Getting color pallette\n", " colors = cm.viridis(col_norm)\n", " \n", " # Legend construction\n", " plot = plt.scatter(GC_content, GC_content, c=GC_content, cmap=\"viridis\")\n", " plt.clf()\n", " plt.colorbar(plot)\n", "\n", " # Barplot \n", " plt.barh(x_pos, y, xerr=y_stdDev, color=colors, align=\"center\")\n", " #plt.errorbar(y, x_pos, 0, y_stdDev)\n", " plt.yticks(x_pos, df1.index.values)\n", " plt.title(name)\n", " \n", " axes = plt.gca()\n", " axes.set_xlim([-0.8,0.8])\n", " \n", " plt.savefig(name+\".pdf\", bbox_inches=\"tight\")" ] }, { "cell_type": "code", "execution_count": 44, "metadata": {}, "outputs": [ { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "name = \"SuperScriptIV : TGIRT \" \n", "barplotFigure(y=df1[\"Comparison\", \"TvS\"],\n", " y_stdDev=df1[\"Comparison\", \"TvSerror\"],\n", " GC_content=df1[\"GC content\", \"TGIRT\"], name=name)\n", "\n", "name = \"ImProm-II 42°C : TGIRT \" \n", "barplotFigure(y=df1[\"Comparison\", \"Tv42\"],\n", " y_stdDev=df1[\"Comparison\", \"Tv42error\"],\n", " GC_content=df1[\"GC content\", \"ImProm-II 42C\"], name=name)\n", "\n", "name = \"ImProm-II 55°C : TGIRT \" \n", "barplotFigure(y=df1[\"Comparison\", \"Tv55\"],\n", " y_stdDev=df1[\"Comparison\", \"Tv55error\"],\n", " GC_content=df1[\"GC content\", \"ImProm-II 55C\"], name=name)\n", "\n", "name = \"ImProm-II 42°C : SuperScriptIV \" \n", "barplotFigure(y=df1[\"Comparison\", \"Sv42\"],\n", " y_stdDev=df1[\"Comparison\", \"Sv42error\"],\n", " GC_content=df1[\"GC content\", \"ImProm-II 42C\"], name=name)\n", "\n", "name = \"ImProm-II 55°C : SuperScriptIV \" \n", "barplotFigure(y=df1[\"Comparison\", \"Sv55\"],\n", " y_stdDev=df1[\"Comparison\", \"Sv55error\"],\n", " GC_content=df1[\"GC content\", \"ImProm-II 55C\"], name=name)\n", "\n", "name = \"ImProm-II 55°C : ImProm-II 42°C\" \n", "barplotFigure(y=df1[\"Comparison\", \"P42v55\"],\n", " y_stdDev=df1[\"Comparison\", \"P42v55error\"],\n", " GC_content=df1[\"GC content\", \"ImProm-II 42C\"], name=name)" ] } ], "metadata": { "kernelspec": { "display_name": "Python 3", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.6.8" } }, "nbformat": 4, "nbformat_minor": 2 }