{ "cells": [ { "cell_type": "code", "source": [ "pip install Bio" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "g_QUWLpGA4Uy", "outputId": "e435d12b-df6f-4b6f-9ea7-4ed082369d8a" }, "execution_count": 1, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/\n", "Requirement already satisfied: Bio in /usr/local/lib/python3.7/dist-packages (1.3.9)\n", "Requirement already satisfied: requests in /usr/local/lib/python3.7/dist-packages (from Bio) (2.23.0)\n", "Requirement already satisfied: tqdm in /usr/local/lib/python3.7/dist-packages (from Bio) (4.64.0)\n", "Requirement already satisfied: mygene in /usr/local/lib/python3.7/dist-packages (from Bio) (3.2.2)\n", "Requirement already satisfied: biopython>=1.79 in /usr/local/lib/python3.7/dist-packages (from Bio) (1.79)\n", "Requirement already satisfied: numpy in /usr/local/lib/python3.7/dist-packages (from biopython>=1.79->Bio) (1.21.6)\n", "Requirement already satisfied: biothings-client>=0.2.6 in /usr/local/lib/python3.7/dist-packages (from mygene->Bio) (0.2.6)\n", "Requirement already satisfied: idna<3,>=2.5 in /usr/local/lib/python3.7/dist-packages (from requests->Bio) (2.10)\n", "Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in /usr/local/lib/python3.7/dist-packages (from requests->Bio) (1.24.3)\n", "Requirement already satisfied: chardet<4,>=3.0.2 in /usr/local/lib/python3.7/dist-packages (from requests->Bio) (3.0.4)\n", "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.7/dist-packages (from requests->Bio) (2022.6.15)\n" ] } ] }, { "cell_type": "code", "execution_count": 2, "metadata": { "id": "k1GKvofMTHXV" }, "outputs": [], "source": [ "from Bio import SeqIO\n", "from sklearn.metrics import confusion_matrix,classification_report\n", "import numpy as np\n", "import pandas as pd\n", "import matplotlib.pyplot as plt\n", "import seaborn as sns\n", "import tensorflow as tf\n", "from sklearn.model_selection import train_test_split\n", "from sklearn.preprocessing import LabelEncoder\n", "from tensorflow.keras.models import Model\n", "from tensorflow.keras.layers import LSTM, Activation, Dense, Dropout, Input, Embedding\n", "from tensorflow.keras.optimizers import RMSprop\n", "from tensorflow.keras.preprocessing.text import Tokenizer\n", "from tensorflow.keras.preprocessing import sequence\n", "from tensorflow.keras.utils import to_categorical\n", "from tensorflow.keras.callbacks import EarlyStopping\n", "%matplotlib inline\n", "from tensorflow.keras.preprocessing.sequence import pad_sequences\n", "from tensorflow.keras.layers import Embedding\n", "from tensorflow.keras.layers import Dense, Input, Flatten\n", "from tensorflow.keras.layers import Conv1D, MaxPooling1D, Embedding, Dropout\n", "from tensorflow.keras.models import Model\n", "from tensorflow.keras.callbacks import ModelCheckpoint\n", "from tensorflow.keras.models import Sequential" ] }, { "cell_type": "code", "source": [ "from google.colab import drive\n", "drive.mount('/content/drive')" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "IBWrhsbJEYM4", "outputId": "402eb2d3-3d72-4909-ac4a-52f438951d53" }, "execution_count": 3, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Drive already mounted at /content/drive; to attempt to forcibly remount, call drive.mount(\"/content/drive\", force_remount=True).\n" ] } ] }, { "cell_type": "code", "execution_count": 4, "metadata": { "id": "klPpounuTHXc", "colab": { "base_uri": "https://localhost:8080/" }, "outputId": "1187fa44-8beb-4161-e0f7-615c507de9a1" }, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "['FAKKFAKKFKKFAKKFAKFAFAF', 'ICLRLPGC', 'FLGSIVGALASALPSLISKIRN', 'FGLPMLSILPKALCILLKRKC', 'CGESCVWIPCVTSIFNCKCKENKVCYHDKIP', 'KLAKLAK', 'GLFDIVKKVVGAIGSL', 'AKRHHGYKRKFH', 'FMPILSCSRFKRC', 'GRKKRRQRRRGGWMWVTNLRTD', 'GIGKFLKKAKKFAKAFVKMNN', 'GIGKFLKKAKKFAKAFVKIINN', 'GLMDTIKGVAKTVAASWLDKLKCKITGC', 'LLRHVVKILSKYL', 'KFKKLAKKF', 'TILLEIKNINAD', 'GLFKVIKKVAKVIKKL', 'FIFHIIKGLFHAGKMIHGLVTRRRH', 'ALYKKFKKKLLKSLKRL', 'TFRAFLSSRLQDLYSIVRRADRAAV', 'AVPDVAFNAYG', 'MRKEFHNVLSSGQLLADKRPARDYNRK', 'YAIDTILAEIKNINA', 'GKWLSLLKHILK', 'FVKLKKILNIILSIFKK', 'GFLGPLLKLAAKGVAKVIPHLIPSRQQ', 'DTHFPICIFCCGCCHRSKCGMCCKT', 'HGVSGHGQHGVHG', 'CKQSCSFGPFTFVCDGNTK', 'GKWMSLLKHILK', 'KWKLFKKIPKFLHL', 'KWKLFKKIGIGAVLKVLKKG', 'FALKALKK', 'FLPVVAGLAAKVLPSIICAVTKKC', 'CGETCVGGTCNTPGCTCSWPVCTRNGLPV', 'AIKLVQSPNGNFAASFVLDGTKWIFKSKYYDSSKGYWVGIYEVWDRK', 'KSCCPNTTGRNIYNTCRLGGGSRERCASLSGCKIISASTCPSDYPK', 'LKCNKLVPLFYKTCPAGKNL', 'KWFKKIPKFLHLAKKF', 'CGESCAMISFCFTEVIGCSCKNKVCYLNSIS', 'FAKLLAKFLKKAL', 'ETWRTEAPSATGQASSLLGGRLLGQ', 'AKWVGDLTLCRWR', 'KILRGVAKKIMRTFLRRILTGKK', 'CGESCVFIPCISTLLGCSCKNKVCYRNGVIP', 'SPWPRPTY', 'FLSFPTTKTYFPHFDLSHGSAQVKGHGAK', 'VALALKALKKL', 'GAARKSIRLHRLYTWKATIYTR', 'GLFAVIKKVASVIGGL', 'CRQSCSFGPLTFVCDGNTK', 'FVQWFSKFLGRIL', 'GWLKKIGKKIERVGQHTRDATIQTIGVAQQAANVAATLK', 'GLFDIVKKVVGALGSL', 'FLFPLITSFLSKVL', 'GLPVCGETCFGGTCNTPGCSCETWPVCSRN', 'FAKKLKKLAKLAKKL', 'GTGLPMSERRKIMLMMR', 'VALALKALKKALKKLKKALKKAL', 'GLLPCAESCVYIPCLTTVIGCSCKSKVCYKN', 'VAKLLAKLAKKVL', 'FAKLLAKLAKKLL', 'PGLGFY', 'GFGKAFHSVSNFAKKHKTA', 'VECYGPNRPQF', 'LKLKSIVSWAKKVL', 'FFPIGVFCKIFKTC', 'GFFSTVKNLATNVAGTVIDTLKCKVTGGCRS', 'FAKKLAKKLKKLAKKLAKKWKL', 'KWKKFLKIGIGKFLHLAKKF', 'FKRIVQRIKDFLR', 'DYPKLTFTTS', 'KWKSFLKTFKSAKKTVLHTLLKAISS', 'VNWKKILPKIIKVVK', 'GLPVCGETCFGGTCNTPGCTCDPWPVCTRN', 'FAGLAANFLPTIICKISYKC', 'ADRGWIKTLTKDCPNVISSICAGTIITACKNCA', 'AANFGPSVFTPEVHETWQKFLNVVVAALGKQYH', 'GVPICGETCTLGTCYTAGCSCSWPVCTRN', 'EPHPDEFVGLM', 'KYKKALKKLAKLL', 'GSSSGRGDSPA', 'KAAKKAWKAAKKAAKWWKKAA', 'AKCIKNGKGCREDQGPPFCCSGFCYRQVGWARGYCKNR', 'GLKKLLGKLLKKLGKLLLK', 'GIIKKIIKKIIKKIIKKI', 'FLKWLFKWAKK', 'FAKKLAKLAKKL', 'FIFHIIKGLFHAGKMI', 'GLFDIVKKVVGTIAGL', 'EFTNVSCTTSKECWSVCQRLHNTSRGKCMNKKCRCYS', 'LLGDFKRIVQRIKDF', 'FLSSIGKILGNLL', 'PAWRKARRWARRMKKLAA', 'GKWMSLLKKILK', 'ALSKALSKALSKALSKALSKALSK', 'FLPAVLRVAAKIVPTVFCAISKKC', 'ATCDLLSGFGVGDSACAAHCIARGNRGGYCNSKKVCVCPI', 'GLFAVIKKVASVIKGL', 'KWFKKIPKFLHLLKKF', 'GFMDTAKNVAKNVAVTLIDNLKCKITKAC', 'RKGWFKAMKSIAKFIAKEKLKEHL', 'GLFDIIKKIAESF', 'FVKLKKIANIINSIFKK', 'FLPLIAGLAANFLPKIFCAITKKC', 'RAGLQFPVGRLLRRLLRRLLR', 'LLRHVVKILEKYL', 'GLFDKLKSLVSDF', 'AIGSILGALAKGLPTLISWIKNR', 'FLPIASLLGKYL', 'KISKRILTGKK', 'FLPLAVSLAANFLPKLFCKITKKC', 'KRAKAAGGWSHWSPWSSC', 'AVLDILKDVGKGLLSHFMEKV', 'GLPVCGETCVGGTCNTPGCACSWPVCTRN', 'ACIKNGGRCVASGGPPYCCSNYCLQIAGQSYGVCKKH', 'FLPLLLAGLPKLLCLFFKKC', 'GLFVGVLAKVAAHVVPAIAEHF', 'VNWKKIILGKIIKVVK', 'KILRGVAKKIMRTFLRRISKDILTGKK', 'FLFRVASKVFPALIGKFKKK', 'CIAKGNGCQPSGVQGNCCSGHCHKEPGWVAGYCK', 'AGECVQGRCPSGMCCSQFGYCGRGPKYCGR', 'ALLGDFFRKSKEKIGKEFKRIVQRIKDFLRNLVPRTES', 'CANSCSYGPLTWSCDGNTK', 'DFGCGQGMIFMCQRRCMRLYPGSTGFCRGFRCMCDTHIPLRPPFMVG', 'FLSLIPKLVKKIIKAFK', 'FFSLLPSLIGGLVSAIK', 'VNWKKILAKIIKVVK', 'FLSAITSLLGKLL', 'AAVPIVNLKDELLFPSWEALFSGSE', 'FAKIIAKIAKIAKKIL', 'LVPCLPGC', 'ATCDLLSGTGINHSACAAHCLLRGNRGGYCNGKAVCVCRN', 'KKVVFKVKFK', 'PGMGIYLPM', 'FLGMIPKLIKKLIKAFK', 'GLFDIVKKIAGHIVSSI', 'GIPCAESCVWIPPCTITALMGCSCKNNVCYNN', 'GIPCAESCVWIPCTVTALIGCGCSNKVCYN', 'FKVKFKVKVK', 'FALKALKKAL', 'GLFDVIKKVASVIKKL', 'GLFSVLGAVAKHVLPHVVPVIAEKL', 'KAFWGLQH', 'VYWKKILGKIIKVVK', 'GFGCPNNYQCHRHCKSIPGRCGGYCGGWHRLPCTCYRCG', 'LKKLAKLALAF', 'FAKLFAKLAKKFAL', 'KRLRRVWRRWR', 'FAKLLAKALKKFAL', 'FLLFPLMCKIQGKC', 'ASIVKTTIKASKKLCRGFTLTCGCHFTGKK', 'CTGAAGGTGCTGTCCCAGAT', 'GFMKYIGPLIPHAVKAISDLI', 'DHYNCVSSGGQCLYSACPIFTKIQGTCYRGKAKCCK', 'FAKFLAKFLKKAL', 'GLFAVIKKVAAVIRRL', 'FKRIVQRIKDFLRNLV', 'FFGHLFKLATKIIPSLFQ', 'FAKLFAKAFKKAL', 'KAAKKWAKAAKKWAKAWKKAA', 'AFKLLGRIIHHVGNFVYGFSHVF', 'PAWRKAFRWAWRMKKLAA', 'GLFDIVKKVVGAFGSL', 'GVGSPYVSRLLGICL', 'FLPLLASLFSGLF', 'ILRWPWWPWRRK', 'GLPTCGETCTLGTCYVPDCSCSWPICMKN', 'KAQIRAMECNIL', 'FLPLVTMLLGKLF', 'KTCENLADTY', 'KAAKKAWKWAKKAAKWAKKAA', 'LLGDFFRKSKEKIGKEFKRIVQRIKDFLRNLVPRTES', 'FAKKLAKLALKLAKL', 'PRFWEYWLRLME', 'VAKLLAKLAKKLL', 'GLLGPLLKIAAKVGSNLL', 'AKKVFKRLEKLFSKIQNDK', 'RFRLPFRRPPIRIHPPPFYPPFRRFL', 'MPKEKVFLKIEKMGRNIRN', 'EPNPDEFFGLM', 'ATRVVYCNRRSGSVVGGDDTVYYEG', 'GGLRSLGRKILRAWKKYGPIIVPIIRI', 'FLSLIPHIVSGVASIAKHF', 'DDTPSSRCGSGGWGPCLPIVDLLCIVHVTVGCSGGFGCCRIG', 'CIPMAWAVSWPHP', 'DYDWSLRGPPKCATYGQKCRTWSPRNCCWNLRCKAFRCRPR', 'GWRTLLKKAEVKTVGKLALKHYL', 'GLFDIVKKIAGHIA', 'GLFDIIKKIAESI', 'FAKLLKLAAKKLL', 'MPKWKVFKKIEKVGRNIRNGIVKAGPAIAVLGEAKALG', 'GIGKFLKKAKKFGKAFVKILKK', 'GMWSKLLGHLLR', 'FALLKL', 'VNWKKILKKIIKVVK', 'GAIKDALKGAAKTVAVELLKKAQCKLEKTC', 'YAIDTILLEIKNINAD', 'GFFALIPKIISSPLFKTLLSAVGSALSSSGGQE', 'GSIPCGESCVFIPCISAIIGCSCSSKVCYKN', 'FLPILGKLLSGIL', 'ENFFKEIERAGQRIRDAIISAAPAVETLAQAQKIIKGGD', 'FAKALAKLAKKLL', 'ECRRLCYKQRCVTYCRGR', 'ALKAALLAILKIVRVIKK', 'HSHRDFQPVLHLVALNSPLSGGMRG', 'FFRLLFHGVHHVGKIKPRA', 'ALWMTLLKKVLKAAAKALNAVLVGANA', 'FAFAKIIAKIAKKII', 'KIAKVALAKLGIGAVLKVLTTGL', 'KWKLFKKKTKLFKKFAKKLAKKL', 'FFRHLFRGAKAIFRGARQGWRAHKVVSRYRNRDVPETDNNQEEP', 'RGDLLRHVVKILSKYL', 'KWLRRVWRWWR', 'GSIPCGESCVFIPCISSVIGCACKSKVCYKN', 'GADFQECMKEHSQKQHQHQG', 'NVWKKILGKIIKVVK', 'PAWAKAFRAAARMKLKAA', 'EGGGPQWAVGHFM', 'FAKLWAKLAKKL', 'MRKWFHNVLSSGQLLADKWPAWDYNRK', 'FFGAIAAALPHVISAIKNAL', 'KAAKKAWKAWKKAAKAAWKKAA', 'KWKSFAKTFKSAKKTVLHTALKAISS', 'GFGCPLNQGACHNHCRSIGRRGGYCAGIIKQTCTCYRK', 'MPRWRLFRRIDRVGKQIKQGILRAGPAIALVGDARAVG', 'KWKLFKKIGIGKFKLAKKF', 'GSIPCEGSCVFIPCISAIIGCSCSNKVCYKN', 'PRFWEYALRLME', 'GFGCNGPWDEDDMQCHNHCKSIKGYKGGYCAKGGFVCKCY', 'VAKALKALLKALKAL', 'FAVGLRAIKRALKKLRRGVRKVAKDL', 'KWKLFKKIPKFLHLAK', 'KTCENLADTFRGPCFATSNC', 'FISAIASFLGKFL', 'GIPCGESCVFIPCITAAIGCSCKSKVCYRN', 'FLSLIPHAINAVSALANHG', 'MWKEFHNVLSSGQLLADKRWARWYNRW', 'KAKLF', 'FAKLLAKLAKK', 'GLLSVLGSVAKHVLPHVVPVIAEHL', 'FKVQNQHGQVVKIFHH', 'FAKIIAKIAKKI', 'FLGALAKIISGIF', 'GFKDWIKGAAKKLIKTVASSIANQ', 'SWLSKTAKKLENSAKKRISEGIAIAIQGGPR', 'FIGTALGIASAIPAIVKLFK', 'VNWKKILGKIKKVVK', 'WKLFKKIPKFLHLAKKF', 'FALALKALKKLLKKLKKLAKKAL', 'VALALKALKKLAKKLKKLAKKAL', 'FLGALFHALSKLL', 'GLVTSLIKGAGKLLGGLFGSVTGGQS', 'ELCEKASQTWSGTCGKTKHCDDQCKSWEGAAHGACHVRDGKHMCFCYFNC', 'GLPVCGETCFTGTCYTNGCTCDPWPVCTRN', 'FLPIVGRLISGLL', 'ACSAG', 'KWKLFKKIPLAKKF', 'KAFDITYVRLKF', 'FLGWLFKWAWK', 'DAEFRHDSGYEVHHQKLVFFAEDVGSNKGAIIGLMVGGVVIA', 'FVDLKKIANIINSIF', 'DCYCRIPACIAGERRYGTCIYQGRLWAFCC', 'KWKLFKKIPLHLAKKF', 'ALWKTLLKNVGKAAGKAALNAVTDMVNQ', 'GFGMALKLLKKVL', 'LRVRLASHLRKLRKRLLRDADDLQKRLAVY', 'ASSSYPLIHWRPWAR', 'GFCRCLCRRGVCRCICTR', 'LMMLILAMNRKDKKKEKK', 'FLSAIASMLGKFL', 'DLRFWNPREKLPLPTLPPFNPKPIYIDMGNRY', 'KWKLFKKALKKLKKALKKAL', 'FAKAIAKIAFGKGIGKVGKKLL', 'KAYARIGNSYFK', 'QETFSDLWKLLP', 'KWWKKAAKAAKKAAKAAKKWA', 'DDALRRLLRRLLRRL', 'ACYCRIPACFAGERRYGTCFYLGRVWAFCC', 'RLFDKIRQVIRKF', 'FAKLLAKLAK', 'GLFGVLAKVAAHVVPAIAEHF', 'GLFDIIKKVASVVGGL', 'TCCATGACGTTCCTGACGTT', 'ALWKDILKNAGKAALNEINQLVNQ', 'YGRKKRRQRRRREADFFWSLCTADMS', 'FAKKLAKKLAKAL', 'GIGDPVTCLKSGAICHPVFCPRRYKQIGTCGLPGTK', 'GQVWEATATVNAIRGSVTPAVSQFNARTAD', 'GMWKKILGHLIR', 'KWKSFLKTFKSAKKTVAHTALKAISS', 'AKIPIKAIKTVGKAVGKGLRAINIASTANDVFNFLKPKKRKA', 'NYQWVPYQGRVPYPRGGLLKLLKKLLKKLLKL', 'GLMSSIGKALGGLIVDVLKPKTPAS', 'AGWGSIFKHIFKAGKFIHGAIQAHND', 'KWKLFKKIPKFLHLAKK', 'QAGGQTCPGGICCSQWGYCGTTADYCSPNNNCQSNCWASG', 'GKWMTLLKHILK', 'LLGDFFRKSKEK', 'GFGCPGNQLKCNNHCKSISCRAGYCDAATLWLRCTCTDCNGKK', 'FCTMIPIPRCY', 'FAKKLAKLAKKLAKLAL', 'FLPLIGKILGTIL', 'GLFAVIKKVAKVIKKL', 'FIHHIFRGIVHAGRSIGRFLTG', 'PAARKAARWAWRMLKKGA', 'FAKKLAKKLKKLAKLALAK', 'IVRRADRAAVP', 'GLLSVLGSVAQHVLPHVVPVIAEHL', 'KWKLFKKIPHLAKKF', 'ATCDLLSKWNWNHTACAGHCIAKGFKGGYCNDKAVCVCRN', 'FALALKALKKLAKKLKKLAKKAL', 'CAAGTACTCAGTGTGGA', 'WALAL', 'GKWMKLLKHILK', 'VAKKLAKLAKKLLAL', 'FLPLIGRVLSGIL', 'KWKLAKKALALL', 'GCASRCKAKCAGRRCKGWASASFRGRCYCKCFRC', 'GIPCGESCVFIPCLTSAIDCSCKSKVCYRN', 'KFKKLAKKW', 'DWTAWSALVAAACSVELL', 'FLPLLAGLAANFLPTIICKISYKC', 'PLLQATLGGGS', 'DPVTYIRNGGICQYRCIGLRHKIGTCGSPFKCCK', 'RRRRRRRRGEDIIRNIARHLAQVGDSMDR', 'FLGALFKALSHLL', 'FAKKLAKKLKKLAKKLAKLAKKL', 'KWKLFKKIGIGKFLHSAKKF', 'KWKSFLKTFKSLKKTVLHTLLKLISS', 'DLRFLYPRGKLPVPTLPPFNPKPIYIDMGNRY', 'FAKLLAKAFKKAL', 'GVPVCGETCFGGTCNTPGCSCDPWPVCSRN', 'FIGLLISAGKAIHDLIRRRH', 'KWKLFKKIPKFLH', 'PAWFKARRWAWRMKKLAA', 'VNWKKILGKIIKVVK', 'FLPIVAKLLSGLL', 'KWKLFKKIPFLHLAKKF', 'FAKLA', 'FLPIVTNLLSGLL', 'MWKWFHNVLSSGQLLADKWWAWWYNWW', 'KLLLKLKLKLLK', 'CSTNTFSLSDYWGNNGAWCTLTHECMAWCK', 'KWKLFKKIPKFLHLAKKF', 'GKWSKILGHLIR', 'FELDRICGYGTARCRKKCRSQEYRIGRCPNTYACCLRKWDESLLNRTKP', 'FAKKALKALKKL', 'FLGALFKVASKVLPSVFCAITKKC', 'FAKLLAKLAKKGL', 'FDIVKKIAGHIVSSI', 'GFKMALKLLKKVL', 'KSCCPNTTGRNIYNTCRFGGGSRQVCASLSGCKIISASTCPSDYPK', 'GMWSKILGHLIR', 'KWKLFKKIGPGKFLHSAKKF', 'GIGKFLHAAKKFAKAFVAEIMNS', 'AALKGCWTKSIPPKPCFGKR', 'ALSILKGLEKLAKMGIALTNCKATKKC', 'KLLLKLLKKLLKLLKKK', 'ACYCRIPACIAGERRYGTCIYQGRLWAFCC', 'GVPICGETCVGGTCNTPGCSCSWPVCTRN', 'RGDLLRHVVKILEKYL', 'PPPEE', 'CCTAAGCCCTTGTGGTGTGT', 'VAKALAKALLKALKAL', 'PAWRKAFRWAKRMLKKAA', 'DIQIPGIKKPTHRDIIIPNWNPNVRTQPWQRFGGNKS', 'VYINKLTPPCGTMYYACEAV', 'FAKLLAKALKKAL', 'LTAEHYAAQATS', 'GMWKKILGKLIR', 'FAKKLAKKLAKLL', 'TTGGTCCTTCAAGAGCTG', 'HTLLTPRR', 'VAKKLAKLAKKLAKLALAL', 'ATCDLASGFGVGSSLCAAHCIARRYRGGYCNSKAVCVCRN', 'GLPVCGETCVGGTCNTPGCGCSWPVCTRN', 'IPCGESCVWIPCISGMFGCSCKDKVCYS', 'IFLLWQR', 'FALALKLKKL', 'VAKKLAKLAKKLAKLAL', 'GFGSLLGKALRLGANVL', 'KWKSFLKTFKSAKKTVLHTALKAISS', 'CHHNLAHAC', 'GFGCPFNQYECHAHCSGVPGYKGGYCKGLFKQTCNCY', 'GRENYHGCTTHWGFTLC', 'KLLRLLKKLLRLLLK', 'FLGLLFHGVHHVGKWIHGLIHGHH', 'HTMYYHHYQHHL', 'GEFLKCGESCVQGECYTPGCSCDWPICKKN', 'YHWYGYTPQNVIGGGKLLLKLLKKLLKLLKKK', 'GMWSKILKHLIR', 'FLPIITNLLGKLL', 'GLPICGETCVGGTCNTPGCSCSWPVCTRN', 'GLFDVIKKVASVIKGL', 'KNWKKILGKIIKVVK', 'FAKKLAKKLKKLAKKLAK', 'RYPAGLPFL', 'FLGMIPGLIGGLISAFK', 'FLPLVGKILSGLI', 'GSIPCGESCVFIPCISAVIGCSCSNKVCYKN', 'FFGTALKIAANILPTAICKILKKC', 'GLLQTIKEKLESLESLAKGIVSGIQA', 'CAGAGTGGGAGAGGCAAGAC', 'VNWRRILGRIIRVVR', 'HHPHG', 'FAKKLAKLAKKLLAL', 'AQCGAQGGGATCPGGLCCSQWGWCGSTPKYCGAGCQSNCK', 'IGKEFKRIVQRIKDFLRNLVPRTES', 'FLPIIAGVAAKVLPKIFCAISKKC', 'IPCGESCVWIPCITAIAGCSCKNKVCYT', 'DHYICAKKGGTCNFSPCPLFNRIEGTCYSGKAKCCIR', 'FKCRRWQWRMKK', 'FAKLLAKLAKKL', 'DSHEERRQGRHGHHEYGRKFHEKHHSHRGY', 'FLGGLMKAFPAIICAVTKKC', 'FAKLLAKLAKAKA', 'DFKLFAVTIKYR', 'RYLGYL', 'FIGPIISALASLFG', 'FALAAKALKKLAKKLKKLAKKAL', 'FALALKLAKKAL', 'PAARKAFRWAWRMLKKAA', 'GIPCGESCVWIPCISSAIGCSCKSKVCYRN', 'GIIKKIIIKKI', 'FLGALIKGAIHGGRFIHGMIQNHH', 'FALALKALKKL', 'KWKLFKKIGIGKFLHSATTF', 'FFGSVLKLIPKIL', 'DFKDWMKTAGEWLKKKGPGILKAAMAAAT', 'KTKLFKKFAKKLAKKLKKLAKKL', 'GDACGETCFTGICFTAGCSCNPWPTCTRN', 'HPTWPQKSVWHGSDPNGRRLTESY', 'KLKNFAKGVAQSLLNKASCKLSGQC', 'DFASCHTNGGICLPNRCPGHMIQIGICFRPRVKCCRSW', 'GFGMALRLLRRVL', 'GKWMSLLKHIWK', 'KAAKKWAKAWKKAAKAWKKAA', 'ALWKNMLKGIGKLAGQAALGAVKTLVGAE', 'FAKLLAKALKKL', 'RKKRRQRRR', 'GFGCPNNYACHQHCKSIRGYCGGYCAGWFRLRCTCYRCG', 'LIAHNQVRQV', 'GIGKFLHSAKKFGKAFVGEIMNS', 'KLAKKLAKLAKLAKAL', 'FAKKLAKKLAKLAL', 'PRFWEYWLRLAE', 'FALALKLAKKL', 'FLPAIAGILSQLF', 'GFLDIIKDTGKEFAVKILNNLKCKLAGGCPP', 'KIFGSLAFL', 'FALKALKKLKKALKKAL', 'RQVFQVAYIIIKA', 'GKWMSLLKHWLK', 'AAKKWAKAKWAKAKKWAKAA', 'GKWKSLLKHILK', 'KWKLFAKIGIGKFLHLAKKF', 'GLFDIAKKVIGVIGSL', 'KKKFPWWWPFKKK', 'GFGCPFNQGACHRHCRSIRRRGGYCAGLFKQTCTCYR', 'GLFVGLAKVAAHNNPAIAEHFQA', 'FLKLLAGLLKNFA', 'GFIFHIIKGLFHAGKMIHGLV', 'KLKNFAIGVAQSLLNKASCKLSGQC', 'GLLDIVKKVVGAFGSL', 'KAQIRAMECNILGRKKRRQRRR', 'EIRLPEPFRFPSPTVPKPIDIDPILPHPWSPRQTYPIIARRS', 'FAKLLAKLAKAKL', 'FVPYNPPRPYQSKPFPSFPGHGPFNPKIQWPYPLPNPGH', 'KSCCPNTTGRNIYNTCRFAGGSRERCAKLSGCKIISASTCPSDYPK', 'TCGTCCTGAGGAGAGAGAGC', 'LFGMALKLLKKVL', 'RWGKWFKKATHVGKHVGKAALTAYL', 'KWKSFLKTFKSAKKTVAHTAAKAISS', 'CTFTLPGGGGVCTLTSECIC', 'HHPHGHHPHGHHPHG', 'DTVACRIQGNFCRAGACPPTFTISGQCHGGLLNCCAKIPAQ', 'RLVSYNGIIFFLK', 'GKWMSLWKHILK', 'FKKLKKIANIINSIFKK', 'GIKCRFCCGCCTPGICGVCCRF', 'YPFPG', 'CHHNATHAC', 'NKWKKILGKIIKVVK', 'GMWSKILGKLIR', 'FALLKALKKAL', 'ALWKTMLKKLGTMALHAGKAALGAAADTISQGTQ', 'FLPILASLAATLGPKLLCLITKKC', 'GRFKRFRKKFKKLFKKLSPVIPLLHLG', 'AWKKWAKAWKWAKAKWWAKAA', 'RRRRRWCMNW', 'DCLSGKYKGPCAVWDNEMCRRICKEEGHISGHCSPSLKCWCEGC', 'KSCCPNTTGRNIYNTCRLTGSSRETCAKLSGCKIISASTCPSNYPK', 'FAKLWAKLAFGKGIGKVGKKLL', 'NHFTLKCPKTALTEPPTLAY', 'KWKLFKKIGIGAVLKVLTTG', 'GLFSVLGAVAKHVLPHVVPVIAEK', 'ELPKLPDDKVLIRSRSNCPKGKVWNGFDCKSPFAFS', 'ACDTATCVTHRLAGLLSRSGGVVKNNFVPTNVGSKAF', 'FALAKKALKKAKKAL', 'RQIKIWFQNRRMKWKK', 'DFKLFAVYIKYR', 'KWKLFKKIPLKKF', 'FALLKALLKKAL', 'AFTCHCRRSCYSTEYSYGTCTVMGINHRFCCL', 'MTLTG', 'FALALKKALKALKKAL', 'FKLAFKLAKKAFL', 'LTFEHYWAQLTS', 'ETFSDLWKLL', 'KWCFRVCYRGICYRRCR', 'WFKKIPKFLHLAKKF', 'AYPGNGVHCGKYSCTVDKQTAIGNIGNNAA', 'GLPVCGETCFGGTCNTPGCSCDPWPMCSRN', 'ELCEKASKTWSGNCGNTGHCDNQCKSWEGAAHGACHVRNGKHMCFCYFNC', 'GLFDVIKKVAAVIGGL', 'GFGSKPLDSFGLNFF', 'GFKLKGMARISCLPNGQWSNFPPKCIRECAMVSS', 'FAKALKALLKALKAL', 'DVKGMKKAIKGILDCVIEKGYDKLAAKLKKVIQQLWE', 'KSCCRNTWARNCYNVCRLPGTISREICAKKCDCKIISGTTCPSDYPK', 'GFFALIPKIISSPLFKTLLSAVGSALS', 'FAFGKGIGKIGKKGL', 'SIGAKILGGVKTFFKGALKELASTYLQ', 'GKWMSFLKHILK', 'RALWGLQH', 'GETFDKLKEKLKTFYQKLVEKAEDLKGDLKAKLS', 'FMPIIGRLMSGSL', 'FLPAIFRMAAKVVPTIICSITKKC', 'ADTLACRQSHQSCSFVACRAPSVDIGTCRGGKLKCCKWAPSS', 'FAKLLAKLAKKVL', 'FVLPLVMCKILRKC', 'GKWSKILGKLIR', 'CHHALTHAC', 'EVWRLAEFLAMPP', 'GVIPCGESCVFIPCISSVLGCSCKNKVCYRD', 'KWKLFKKIKFLHSAKKF', 'GLPVCGETCAGGTCNTPGCSCSWPICTRN', 'FFPIIAGMAAKLIPSLFCKITKKC', 'MPFLFCNVNDVCNFASRNDYSCNYYSNSYSFWLASLNPER', 'KLALKLALKALKAAKLA', 'GFKDLLKGAAKALVKTVLF', 'FAKKLAKKLKKLAKKLAKLALALKALALKAL', 'FLGGILNTITGLL', 'GIIKKIIIKKIIIKKI', 'ESVFSKIGNAVGPAAYWILKGLGNMSDVNQADRINRKKH', 'KWKKLLKKPPPLLKKLLKKL', 'FLPLLFGAISHLL', 'APPGARPPPGPPPPGPPPPGP', 'FKDLKKIANIINSIFKK', 'IAAHDTPGPVWLS', 'TILAEIKNINAD', 'ARLKKCFNKVTGYCRKKCKVGERYEIGCLSGKLCCAN', 'TAGIKLTVPIEKFPVTTQTFWG', 'KILRGVAKKILRTFLRRISKDILTGKK', 'AGCIKNGGRCNASAGPPYCCSSYCFQIAGQSYGVCKNR', 'GIGGKILSGLKTALKGAAKELASTYLH', 'FAKLLAKLAKAKG', 'FLPIIASVAAKVFSKIFCAISKKC', 'KWKLFKKIPKFLHSAKKF', 'FAKLLAKLAKKEL', 'GIPCGESCVFIPCITGAIGCSCKSKVCYRN', 'FAKLF', 'PRFWEAWLRLME', 'HHPHGHHPHG', 'GAFGNFLKGVAKKAGLKILSIAQCKLFGTC', 'THRPPMWSPVWPGGGKLLLKLLKKLLKLLKKK', 'GIGGVLLSAGKAALKGLAKVLAEKYAN', 'ESEFDRQEYEECKRQCMQLETSGQMRRCVSQCDKRFEEDIDWSKYDNQD', 'GIPCGESCVFIPCISSVIGCSCSSKVCYRN', 'RKAFRWAWRMLKKAAPSITCVR', 'ATCDLLSGTGVKHSACAAHCLLRGNRGGYCNGRAICVCRN', 'CHHNLTAAC', 'LGQSAASAHHAYIVLAIENSFMTASKKK', 'PAWRKAFRAAWRMLKKAA', 'KWKLFKKIPKFLHLA', 'AAKPMGITCDLLSLWKVGHAACAAHCLVLGDVGGYCTKEGLCVCKE', 'KLCGETCFKFKCYTPGCSCSYPFCK', 'FLPPSPWKETFRTS', 'GIPCAESCVWIPCTVTALVGCSCSDKVCYN', 'PRFWEYWLRAME', 'FLPVLAGIAAKVVPALFCKITKKC', 'GLFGVLGSIAKHVLPHVVPVIAEKL', 'FAKLAKKLL', 'RWKIFKKIEKMGRNIRDGIVKAGPAIEVLGSAKAIGK', 'GRKKRRQRRR', 'KLLKLLLKLYKKLLKLL', 'VAKLLAKALKKLL', 'KKKKKEGKKQ', 'FALALKA', 'GCSRWIIGIHGQICRD', 'LPKWKVFKKIEKVGRNIRNGIVKAGPAIAVLGEAKALG', 'AMVGT', 'KAAKKAWKAAKKAWKAAKKAA', 'GLFKVLGSVAKHLLPHVAPVIAEK', 'AAWKWAWAKKWAKAKKWAKAA', 'FDIVKKVVGTIAGL', 'RRRRRNWMWC', 'ATPATPTVAQFVIQGSTICLVC', 'FAKLLAKALKKFL', 'DQYKCLQHGGFCLRSSCPSNTKLQGTCKPDKPNCCKS', 'PRAWEYWLRLME', 'ATRSYGNGVYCNNSKCWVNWGEAKENIAGIVISGWASGLAGMGH', 'ERRP', 'KWKSFLKTFKSLKKTVLHTLLKAISS', 'DKLIGSCVWGATNYTSDCNAECKRRGYKGGHCGSFWNVNCWCEE', 'ACDCRGDCFCGGGGIVRRADRAAVP', 'FIITGLVRGLTKLF', 'ATCDLLSGIGVQHSACALHCVFRGNRGGYCTGKGICVCRN', 'KWKFKKIPKFLHLAKKF', 'FFPMLAGVAARVVPKVICLITKKC', 'GLFDVIKKVASVIGGL', 'KILRGVAKKIMRTFLRRISKKILTGKK', 'TRSSRAGLQFPVGRVHRLLRK', 'GNFRYLAPP', 'KRFKQDGGASHASPASS', 'YSL', 'FLPAIVGAAAKFLPKIFCAISKKC', 'FASLLGKALKALAKQ', 'FVKLKKILNIINSIFKK', 'FAKLLAKALKLKL', 'ALFSILRGLKKLGNMGQAFVNCKIYKKC', 'FAKGVGKVGKKAL', 'GLLGLLGSVVSHVLPAITQHL', 'FLPIIGKLLSGLL', 'FLSLIPSLVGGSISAFK', 'FAKLLALALKLKL', 'WKKIPKFLHLAKKF', 'FAKKLAKKLKKLAKKLIGAVLKV', 'ALWKTIIKGAGKMIGSLAKNLLGSQAQPES', 'GASCGETCFTGICFTAGCSCNPWPTCTRN', 'FKLFKKIPKFLHLAKKF', 'FAKKLAKKLKKLAKKLAKLALAL', 'FAKLLAKLAKLKL', 'MRGIRGADFQAFQQARAVGLAGTFR', 'FAKLLFKALKKAL', 'FALALKAKKL', 'CYTQYRKCQELTA', 'GLPVCGETCFGGTCNTPGCSCTWPICTRD', 'ATYYGNGLYCNKEKCWVDWNQAKGEIGKIIVNGWVNHGPWAPRR', 'FAKKLAKLAKKLAKAL', 'GCWSTVLGGLKKFAKGGLEAIVNPK', 'CGESCVFIPCITSVAGCSCKSKVCYRNGIP', 'FLPLLASLFSRLL', 'GFGCPLDQMQCHRHCQTITGRSGGYCSGPLKLTCTCYR', 'FLPKTLRKFFCRIRGGRCAVLNCLGKEEQIGRCSNSGRKCCRKKK', 'KWKKLAKKW', 'FAKKLAKLAKKALAL', 'GFGSLFKFLAKKVAKTVAKQAAKQGAKYIANKQTE', 'FLGALFKVASKVLPSVKCAITKKC', 'GIACGESCVFLGCFIPGCSCKSKVCYFN', 'FAKKLAKKLKKLAKLALAL', 'FWGHIWNAVKRVGANALHGAVTGALS', 'FALAKLAKKAKAKLKKALKAL', 'KSCCPSTTARNIYNTCRLTGASRSVCASLSGCKIISGSTCDSGWNH', 'AFGMALKLLKKVL', 'FAKLLAKKLL', 'ATAVDFGPHGLLPIRPIRIRPLCGKDKS', 'YAKLLAKLAKKAL', 'FAKKLAKLAKKLAKLALAL', 'KQLIRFLKRLDRNGGGKLLLKLLKKLLKLLKKK', 'GKWKKILGHLIR', 'DEVD', 'VNWKKLLGKLLKVVK', 'EKKPPRPPQWAVGHFM', 'KWKLFKKISKFLHLAKKF', 'KWKLFKKILKFLHLAKKF', 'ALWKNMLKGIGKLAGQAALGAVKTLVGA', 'PAWFKARRWAWRMLKKAA', 'KSCCKNTTGRNIYNTCRFAGGSRERCAKLSGCKIISASTCPSDYPK', 'FITLLLRKFICSITKKC', 'GFGCPNDYPCHRHCKSIPGRAGGYCGGAHRLRCTCYR', 'FLPLLLAGLPLKLCFLFKKC', 'CHHNLTHAC', 'FLPLIAGLIGKLF', 'GLPVCGETCVGGTCNTPGCSCSWPVCTRN', 'GLFAVIKKVAAVIKKL', 'CIWVSDGKKLWRH', 'KVKVKVKVPPTKVKVKVK', 'GIIKKIIKKI', 'MWKWFHNVLSSWQLLADKRPARDYNRK', 'APGNKAECEREKGYCGFLKCSFPFVVSGKCSRFFFCCKNIW', 'FLPILAGLAAKIVPKLFCLATKKC', 'GFFKKAWRKVKHAGRRVLDTAKGVGRHYVNNWLNRYR', 'PAWRKAFRKAWRMLKKAA', 'VNWKKVLGKIIKVAK', 'AREASKSLIGTASCTCRRAWICRWGERHSGKCIDQKGSTYRLCCRR', 'LLAGLAANFLPTIICKISYKC', 'LKKLLKWLLKLLK', 'SFLTSFKDMAIKVAKDAGVNILNTISCKIFKTC', 'NSGGAAVVAALGCAAGGVKYGRLLGPWGAAIG', 'NIPQLTPTP', 'SFLSTFKELAINAAKNAGQSLLHTLSCKLDKTC', 'DPVTCLKNGAICHPVFCPRRYKQIGTCGLPGTKCCK', 'SNDSLWYGVGQFMGKQANCITNHPVKHMIIPGYCLSKILG', 'LFGFLIPLLPHIIGAIPQVIGAIR', 'WLGSALKIGAKLLPSVVGLFKKKKQ', 'RWKVFKKIEKMGRNIRDGIVKAGPAIEVLGSAKALGK', 'TLYRRFLCKKMKGRCETACLSFEKKIGTCRADLTPLCCKEKKKH', 'KWKSFKKKLTSKFLHSAKKF', 'ASGWVCTLTIECGTVICAC', 'NIWKKIASIAKEVLKAL', 'KPWERL', 'ALWKTMLKKLGTVALHAGKAALGAAADTISQGA', 'RRAAVVLIVIRR', 'DLFQVIKEKLKELTGGVIEGIQGV', 'RWKVFKKIEKVGRNIRDGVIKAAPAIEVLGQAKAL', 'CIKNGNGCQPNGSQGNCCSGYCHKQPGWVAGYCRRK', 'KKSYPEYGSLDLRKECKMRRGHCKLQCSEKELRISFCIRPGTHCCM', 'GLLSGILGAGKHIVCGLSGLR', 'FTLKKSLLVLFFLGTISLSLCQEERAADEEDNGEVEE', 'GLLDTIKNMALNAAKSAGVSVLNTLSCKLSKTC', 'AALRGALRAVARVGKAILPHVAIANPYVRTPYVHNNP', 'IASKFICTPGCAKTGSFNSYCC', 'LLKLLKWLLKLLK', 'ITSISLCTPGCKTGALMGCNMKTATCNCSIHVSK', 'AALRGCWTKSIPPKPCSGKR', 'SLGVTLGAAGVYTATQTIATQIWKCGAVLTTSAECSRTGKSC', 'IGPDTKKCVQRKNACHYFECPWLYYSVGTCYKGKGKCCQKRY', 'FLPMLAGLAANFLPKIVCKITKKC', 'INWSSIFEKVKNLV', 'GIFSKISGKAIKNLFIKGAENVGKHVGIDVVRTGIDVVGCKIKGEC', 'GLFGKILGVGKKVLCGLSGMC', 'KVHGSLARAGK', 'GIMDTVKNAAKDLAGQLLDKLKCKITAC', 'GVLSNVIGYLKKLGTGALNAVLKQ', 'INWLKLGKMVIDAL', 'GINSLSSEMHKKCYKNGICRLECYESEMLVAYCMFQLECCVKGNPAP', 'INMKASAAVAKKLL', 'RLKLLLRLK', 'GLFLDTLKGAAKDVAGKLLEGLKCKIAGCKP', 'RFIYMKGFGKPRFGKR', 'SIFAFQDESPSAIAQAKLFK', 'GIPCGESCVFIPCITGIAGCSCKSKVCYRN', 'KTCENLANTYRGPCFTTGSCDDHCKNKEHLRSGRCRDDFRCWCTRNC', 'GLFSILKGVGKIALKGLAKNMGKMGLDLVSCKISKEC', 'SSMKLSFRARAYGFRGPGPQL', 'RSNKGFNFMVDMIQALSK', 'RLCRIVVIRVCR', 'KPYCSCKWRCGIGEEEKGICHKFPIVTYVCCRRP', 'KWKLFKKGIGAVLKV', 'TTPLCVGVIIGLTTSIKICK', 'STIVCVSLRICNWSLRFCPSFKVRCPM', 'RVCMAIPLPLCH', 'ITSFSLCTPGCAKTGSFNSYCC', 'ACQFWSCNSSCISRGYRQGYCWGIQYKYCQCQ', 'FDIMGLIKKVAGAL', 'FTMKKSPLLLFFLGTISLSLC', 'LLGDFFRKAKEKIGKEFKRIVQR', 'GVLDILKGAAKDLAGH', 'RWRWRW', 'GTQRCWNLYGKCRHRCSKKERVYVYCVNNKMCCVKPKYQPKERWWRF', 'GILDTLKNLAKTAGKGALQGLVKMASCKLSGQC', 'AILTTLANWARKFL', 'MAADIISTIGDLVKLIINTVKKFQK', 'VGECVRGRCPSGMCCSQFGYCGKGPKYCGR', 'RLARRVVIRVAR', 'VARGWKRKCPLFGKGG', 'FFPIVGKRLYGLL', 'VIDDLKKVAKKVRRELLCKKHHKKLN', 'INWLKLGKKLLSAL', 'INWLKLGKAIIDAL', 'QSINNPITCLTKGGVCWGPCTGGFRQIGTCGLPRVRCCKKK', 'KWKSFIKKLTSKFLHLAKKF', 'SLWENFKNAGKQFILNILDKIRCRVAGGCRT', 'LRDLKCFCRRKSCNWGEGIMGICKKRYGSPILCCR', 'SVLGKSVAKHLPHVVPVIAEKT', 'DDDQVEVQQEVKRGFLSTVKNLATNVAGTVIDTLKCKVTGGCRT', 'QESKKGILLKPKTCNTNADCAKFCKGPIQNCLYHTCACVPGNPHCC', 'QRPYTQPLIYYPPPPTPPRIYRA', 'QEAQSVACTSYYCSKFCGSAGCSLYGCYLLHPGKICYCLHCSR', 'SLGSFLKGVGTTLASVGKVVSDQFGKLLQAGQ', 'SMWSGMWRRKLKKLRNALKKKLKGE', 'FIKELLPHLSGIIDSVANAIK', 'GLLGSLFGAGKKVACALSGLC', 'RPRCWIKIKFRCKSLKF', 'VAGPFRIPPLRREFQ', 'GFWGKLWEGVKNAI', 'GLRSKIWLWVLLMIWQESNKFKKM', 'GILDSLKNLAKNAAQILLNKASCKLSGQC', 'IIGPVLGLVGKPLESLLE', 'QCVGTITLDQSDDLFDLNCNELQSVR', 'DTTFCRCRVSCNILEKYSGKCELSGRTARICC', 'ATAWDFGPHGLLPIRPIRIRPLCGKDKS', 'ALLDKLKSLGKVVGKVAIGVAQHYLNPQ', 'APRKNVRW', 'VTCFCRRRGCASRERHIGYCRFGNTIYRLCCRR', 'WKPFKKIEKAVRRVRDGVAKAGPAVAVVGQAT', 'ATCDLASKWNWNHTLCAAHCIARRYRGGYCNSKAVCVCR', 'GLLGAMFKVASKVLPHVVPAITEHF', 'GILDFAKTVVGGIRNALGI', 'TGVAWRIT', 'VLPIIGNLLNSLL', 'QLKSTCRIAEAWKGAKECNAKCAALGTTRGGVCQKFLGDLYCCCWD', 'MFFSSKKCKTVSKTFRGPCVRNA', 'RQRDPQQQYEQCQERCQRHETEPRHMQTCQQRCERRYEKEKRKQQKR', 'VQLRIRVRVIRK', 'GIGGALLSAGKAALKGLAKGFAEHF', 'ATCDALSFSSKWLTVNHSACAIHCLTKGYKGGRCVNTICNCRN', 'DQYRCLQNGGFCLRSSCPSHTKLQGTCKPDKPNCCRS', 'GSKKPVPIIYCNRRTGKCQR', 'AVVNGVNYVGETTAA', 'FLANQECFSEYRHCRMKCKANEYAIRYCADWTICCRVKKREAKKKIMW', 'RRICRCRIGRCLGLEVYFGVCFLHGRLARRCCR', 'ANFEIVNNCPYTVWAAASPGGGRRLDRGQT', 'SPIHACRYQRGVCIPGPCRWPYYRVGSCGSGLKSCCVRNRWA', 'GVFTLIKGATQLIGKTLGKELGKTGLELMACKITEQC', 'ILPILGNLLNSLL', 'FLSTALKVAANVVPTLFCKITKKC', 'GVLDTFKDVAIGVAKGAGTGVLKALLCKLDKSC', 'MGALIKTGAKIIGSGAAGGLGTYIGHKILGK', 'GNRPVYIPPPRPPHPRL', 'IDWLKLGKMVIDAL', 'GLGKAQCAALWLQCASGGTIGCGGGAVACQNYRQFCR', 'GIFTFEDESTTTVAPAKLYK', 'QTCASRCPRPCNAGLCCSIYGYCGSGAAYCGAGNCRCQCRG', 'RKFHEKHHSHRGYR', 'PRCPPCPRCSWCPRCPTCPRCNCNPK', 'LKWLLKWLK', 'FIGAILPAIAGLVGGLINR', 'GVFLDALKKFAKGGMNAVLNPK', 'SYVGDCGSNGGSCVSSYCPYGNRLNYFCPLGRTCCRRSY', 'IIGVSEMERCHKKGGYCYFYCFSSHKKIGSCFPEWPRCCKNIK', 'RKCLRWQWAMRKYGG', 'GLPVCGETCFGGTCNTPGCTCSYPICTRN', 'GIIDIAKKLVGGIRNVLGI', 'GPGKWLPWLQPAYDFVTGLAKGIGKEGNKNKWKNV', 'FLPAVIRVAANVLPTVFCAISKKC', 'ASVVKTTIKASKKLCKGATLTCGCNITGKK', 'IRNSLTCRFNFGICLPKRCPGRMRQIGTCF', 'GFGCPNNYQCHRHCKSIPGRCGGYCGGWHRLRCTCYRC', 'ILPIIGKILSTIF', 'ATCDLFSFRSKWVTPNHAGCAAHCIFLGNRGGRCVGTVCHCRK', 'FLPLIGKVLSGIL', 'GLFSKFAGKGIVNFLIEGVE', 'GLLSGILNTAGGLLGNLIGSLSNGES', 'FTCAISCDIKVNGKPCKGSGEKKCSGGWSCKFNVCVKV', 'KEKLKLKCKAPKCYNDKLACT', 'TTHSGKYYGNGVYCTKNKCTVDWAKATTCIAGMSIGGFLGGAIPGKC', 'KINWGNVGGSCVGGAVIGGALGGLGGAGGGCITGAIGSIWDQW', 'DEKGPKWKR', 'KWKWKWKWKW', 'GLWQKIKDKASELVSGIVEGVK', 'SIGSAFKKALPVAKKIGKAALPIAKAALP', 'KYYGNGVSCNKKGCSVDWGKAIGIIGNNSAANLATGGAAGWSK', 'GKIPVKAIKQAGKVIGKGLRAINIAGTTHDVVSFFRPKKKKH', 'GLMDMVKGAAKNLFASALDTLKCKITGC', 'RRIIIRWRRI', 'GTTVVNSTFSIVLGNKGYICTVTVECMRNCSK', 'EMHKKCYKNGICRLECYESEMLVAYCMFQLECCVKGNPAP', 'HGPDSCNHDRGLCRVGNCNPGEYLAKYCFEPVILCCKPLSPTPTKT', 'TPCGESCVYIPCISGVIGCSCTDKVCYLN', 'GLLKRIKTLL', 'FLPLLAGLAANFLPKLFCKITRKC', 'GLWSKIKETGKEAAKAAGKAALNKIAEAV', 'KWLKKWL', 'AHCLAIGRK', 'LFCKGGSCHFGGCPSHLIKVGSCFGFRSCCKWPWNA', 'MPCSCKKYCDPWEVIDGSCGLFNSKYICCREK', 'ALWKDILKNAGKAALNEINQIVQ', 'GFSSLFKAGAKYLLKSVGKAGAQQLACKAANNCA', 'KKINNPVSCLRKGGRCWNRCIGNTRQIGSCGVPFLKCCKRK', 'GLWNTKLEAGLLFAMGKLDLKRCLKAGGC', 'LSCKRGTCHFGRCPSHLIKGSCSGG', 'SIPCGESCVFIPCTVTALLGCSCKSKVCYKN', 'RVCSAIPLPICH', 'MTAQGNKPSSHDVITGRWTPSAADRAAGRVSGFGVITNIINGGLDC', 'YENPYGCPTDEGKCFDRCNDSEFEGGYCGGSYRATCVCYRT', 'FKTWKRPPFQTSCWGIIKE', 'SGISGPLSCGRNGGVCIPIRCPVPMRQIGTCFGRPVKCCRSW', 'SDYSRKRDPPQKYEEE', 'GIFSTVFKAGKGIVCGLTGLC', 'ENDHRMPYELNRPNNLSKGGAKCGAAIA', 'GDPTFCGETCRVIPVCTYSAALGCTCDDRSDGLCKRN', 'GLMDTVKNAAKNLAGQLLDTIKCKMTGC', 'NEEEKVKWEPDVP', 'KRIVQRIKDFLRNLVPRTES', 'DKLIGSCVWGAVNYTSDCNGECLLRGYKGGHCGSFANVNCWCET', 'GLLDTFKNLALNAAKSAGVSVLNSLSCKLSKTC', 'RDCRSQSKTFVGLCVSDTNCASVCLTEHFPGGKCDGYRRCFCTKDC', 'QPWLPFR', 'GLWKSLLKNVGKAAGKAALNAVTDMVNQS', 'RIIDLLWRVRRPQKPKFVTVWVR', 'GLWNSIKIAGKKLFVNVLDKIRCKVAGGCKTSPDVE', 'FLPIVAGLAANFLPKIVCKITKKC', 'FLPIIAGIAAKVFPKIFCAISKKC', 'SLQYVMSAGPYTWYKDTRTGKTICKQTIDTASYTFGVMAEGWGKTFH', 'INWKKIKSIIKAAMN', 'SDCNINSNTAADVILCFNQVGSCALCSPTLVGGPVP', 'APVPFSCTRGCLTHLV', 'RQRDPQQQYEQCQKHCQRRETEPRHMQTCQQRCERRYEKEKRKQQKR', 'APRRQLKW', 'DIGGSRQGCVA', 'QRFSQPTFKLPQGRLTLSRKF', 'SVSCLRNKGVCMPGKCAPKMKQIGTCGMPQVKCCKRK', 'ILPFVAGVAAMEMEHVYCAASKKC', 'QETCHDLIMKRDCDEATCVNMCQQKWKGSGGSCFQNFNVMSCICNFPCQV', 'ILGPVLGLVSNALGGLIKKI', 'HEPCGESCVFIPCITTVVGCSCKNKVCYN', 'GLKDKFKSMGEKLKQYIQTWKAKF', 'SRWPSPGRPRPFPGRPKPIFRPRPCNCYAPPCPCDRW', 'RVCRRRSAGFKGVCMSDHNCAQVCLQEGYGGGNCDGIMRQCKCIRQC', 'AISCGQVSSAIGPCLSYARGQGSAPSAGCC', 'SMSGFSKPHD', 'GFKDWIKGAAKKLIKTVAANIANQ', 'NWYVKKCLNDVGICKKKCKPEELHVKNGRAMCGKQRDCCVPAD', 'VFGTLGSTDDSLFGRYKQDIFNDHRGHLQGQAYGSR', 'FKCRRWQWRAKKLGA', 'SIYERCELARELINR', 'GKREKCLRRNGFCAFLKCPTLSVISGTCSRFQVCC', 'VLSIVACSSGCGSGKTAASCVETCGNRCFTNVGSLC', 'RKFHEKHHSHRGYRSNYLYDN', 'GGTIFDCGESCFLGTCYTKGCSCGEWKLCYGTN', 'GFLDTLKNMALNAAKGAGGSVLKALFCKLFKTC', 'MDVVRTLILCVCLFGLTFA', 'GFWKKVGSAAWGGVKAAAKGAAVGGLNALAKHIQ', 'GICRCLCRRGVCRCICVL', 'GRFRRLRKKTRKRLKKIGKV', 'KWKLFKKLKVLTTGL', 'AVDLAKIANIANKVLSSLFGK', 'EALYNSEDLYEETSDSDD', 'ALFSILRGLKKLGKMGQAFVNCEIYKKC', 'SWLSKTYKKLENSAKKRISEGVAIAILGGLR', 'GIGASILSAGKSALKGFAKGLAEHFAN', 'GIGAAILSAGKSALKGLAKGLAEHF', 'QSISCAESCVWIPCATSLIGCSCVNSRCIYSK', 'KRKCPKTPFDNTPGAWFAHLILGC', 'LGWGRRCPQCPRCPSCPSCPRCPRCPRCKCNPK', 'GLLDTFKNLAINAAESAGVSVLNSLSCKLSKTC', 'LRDLVCYCRKRGCKRRERMNGTCRKGHLMYTLCCR', 'GTQRCWNLYGKCRYRCSKKERVYVYCINNKMCCVKPKYQPKERWWPF', 'TNYGNGVGVPDAIMAGIIKLIFIFNIRQGYNFGKKAT', 'GLLDVVKGAAKNLLASALDKLKCKVTGC', 'FLPMLAGLAANFLPKLFCKITKKC', 'SASVLKTSIKVSKKYCKGVTLTCGCNITGGK', 'GLWQKIKNAAGDLASGIVEGIKS', 'GIFSLVKGAAKLAGKGLAKEGGKFGLELIACKIAKQC', 'RIWVIRWR', 'FLSLIPHAINAVSAIAKHN', 'GVFTFEDESTSTVAPAKLYK', 'RFRPPIRRPPIRPPFRPPFRPPVRPPIRPPFRPPFRPPIGPFP', 'GLFSVVTGVLKAVGKNVAGSLLEQLKCKISGGC', 'GTIPCGESCVFIPCLTSALGCSCKSKVCYKN', 'GFLSTVKNLATNVAGTVLDTIRCKVTGGCRP', 'GLWNSIKIAGKKLFVNVLDKIRSKVAGGS', 'GLRSKIKEAAKTAGKMALGFVNDMA', 'IDWKKVDWKKVSKKTCKVMLKACKFL', 'CFKFKFKFGSGFKFKFKFC', 'FLPAVLRVAAKVVPTVFCLISKKC', 'TVVTNA', 'DKLIGSCVWGAVNYTSNCNAECKRRGYKGGHCGSFLNVNCWCET', 'NNEAQCEQAGGICSKDHCFHLHTRAFGHCQRGVPCCRTVYD', 'PPCPSCLSCPWCPRCLRCPMCKCNPK', 'FFPTIAGLTKLFCAITKKC', 'GGGVIQTISHECRMNSWQFLFTCCS', 'LRDLVCYCRKRGCKRREHINGTCRKGHLLYMLCCR', 'VFIDILDKMENAIHKAAQAGIGIAKPIENMILPKLTK', 'GRKSDCFRKSGFCAFLKCPSLTLISGKCSRFYLCCKRIWG', 'CVKCKCKCGSGVKVKVKVC', 'GIFNVFKGALKTAGKHVAGSLLNQLKCKVSGEC', 'YPGPQAKEDSEGPSQGPASREK', 'GFMDTAKNVAKNMAVTLLDNLKCKITKAC', 'GLPGKKNVLKKSRESSGKPGGTNKKPF', 'SLFSLIKAGAKFLGKNLLKQGACYAACKASKQC', 'RAEAVPPGFTPFRKP', 'NRWTNAYSAALGCAVPGVKYGKKLGGVWGAVIGGVGGAAVCGLAGYVRKG', 'GLWSTIKQKGKEAAIAAAKAAGQAALGAL', 'IIGHLIKTALGFLGL', 'GTPGFQTPDARVISRFGFN', 'GIFPKIIGKGIVNGIKSLAKGVGMKVFKAGLNNIGNTGCNNRDEC', 'HSSGYTRPLPKPSRPIFIRPIGCDVCYGIPSSTARLCCFRYGDCCHR', 'GILLDKLKNFAKTAGKGVLQSLLNTASCKLSGQC', 'GGLKKLGKKLEGAGKRVFNAAEKALPVVAGAKAL', 'GFGCPFNQGACHRHCRSIRRRGGYCAGLIKQTCTCYRN', 'GLVTGLLKTAGKLLGDLFGSLTG', 'VGALAVVVWLWLWLW', 'LLGPVLGLVSNALGGLLKNI', 'AICKKPSKFFKGACGRDADCEKACDQENWPGGVCVPFLRCECQRSC', 'GRRRSVQWCAVSQPEATKCFQWQRNMRKVRGPPVSCIKRDSPIQCIQA', 'GGAGHVPEYFVGIGTPISFYG', 'STPVLASVAVSMELLPTASVLYSDVAGCFKYSAKHHC', 'INTWNTTATSTSIIISETFGNKGKVCTYTVECVNNCRG', 'RRWRIVVIRVRR', 'RWKVFKKIEKVGRHIRDGVIKAGPAITVVGQATAL', 'CIKNGNGCQPDGSQGNCCSRYCHKEPGWVAGYCR', 'GLVSSIGRALGGLLADVVKSKEQPA', 'RRWWRRWRRW', 'FLPAVLLVATHVLPTVFCAITRKC', 'WKKIASIGKEVLKAL', 'GATAIKQVKKLFKKWGW', 'FLPIAGKLLSGLSGLL', 'GKFSGFAKILKSIAKFFKGVGKVRKQFKEASDLDKNQ', 'FFPNVASVPGQVLKKIFCAISKKC', 'DHYNCVRSGGQCLYSACPIYTRIQGTCYHGKAKCCK', 'FVGAALKVLANVLPPVISWIKQ', 'RCICTRGFC', 'FLPIVTNLLSGLLGK', 'GFKDWIKSAAKKLIKTVASNIANQ', 'ASSGWVCTLTIECGTVICACR', 'FLPMLAGLAANFLPELFCKITKKC', 'SFLTTVKKLVTNVAALAGTVIDTIKCKITGGCRT', 'GLLSGILGAGKHIVCGLSGPCQSLNRKSSDVEYHLAKC', 'ALWKNMLSGIGKLAGQAALGAVKTLV', 'VDKPDYRPRPRPPNM', 'NLVSGLIEARKYLEQLHRKLKNCKV', 'ITSVSWCTPGCTSEGGGSGCSHCC', 'ESDTVTCRKMKGKCSFLLCPFFKRSSGTCYNGLAKCCRPFW', 'RVKRVWPLVIRTVIAGYNLYRAIKKK', 'QKIAEKFSGTRRG', 'GMASKAGAIAGKIAKVALKAL', 'LRDLVCYCRSRGCKGRERMNGTCRKGHLLYTLCCR', 'FTMKKSLLLIFFLGTISLSLCEQER', 'QKECIGPCDMFTDCQAACVGIRKGYNYGQCVAWKPKDDDPFTCCCYKLTP', 'RIWVIWRR', 'GGTIFDCGETCFLGTCYTPGCSCGNYGFCYGTN', 'GFRDVLKGAAKQFVKTVAGHIANI', 'KDRPKKPGLCPPRPQKPCVKECKNDWSCPGQQKCCNYGCIDECRDPIFVN', 'GIMDSVKNVAKNIAGQLLDKLKCKITGC', 'GWLKKIGKKIERVGQHTRDATIQGLGVAQQAANVAATAR', 'GILKKFMLHRGTKVYKMRTLSKRSH', 'MSKRDCNLMKACCAGQAVTYAIHSLLNRLGGDSSDPAGCNDIVRKYCK', 'AKKVFKRLEKLFSKIFNFK', 'SAIWFWMTPQSPK', 'SGFVLKGYTKTSQ', 'RIKRFWPVVIRTVVAGYNLYRAI', 'IAPIIVAGLGYLVKDAWDHSDQIISGFKKGWNGGRRK', 'WFYQGMNIAIYANIGGVANIIGYTEAAVATLLGAVVAVAPVVP', 'FLGGLWKAMSNLL', 'NCIQQCVSKGAQGGYCTNEKCTCY', 'KRCHLTIDKATACSLSDCRLSCYSGYNGVGKCFDDPKVAGPSNCGCIYNC', 'DHYNCVKGGGQCLYSACPIYTKVQGTCYGGKAKCCK', 'IIGLVSKGTCVLVKTVCKKVLKQG', 'GLFTLIKGAYKLDAPTVACN', 'KWKSFIKKLTSKFLHSADKF', 'SLFSLIKAGAKFLGKNLLKQGAQYAACKVSKEC', 'SIVPIRCRSNRDCRRFCGFRGGRCTYARQCLCGY', 'WNPFKELEKVGQRVRDAVISAGPAVATVAQATALAK', 'KTKLTEEEKNRLNFLKKISQRYQKFALPQYLKTVYQHQK', 'GVCDMADLA', 'VIVFVASVAAEMMQHVYCAASKKC', 'LLPIVGNLLNSLL', 'GIFSKINKKKAKTGLFNIIKTVGKEAGMDVIRAGIDTISCKIKGEC', 'FKARRWQWRMKKLGA', 'RECRSESKKFVGLCVSDTNCASVCLTERFPGGKCDGYRRCFCTKDC', 'RCRFCCRCCPRMRGCGICCRF', 'RTCASQSQRFKGKCVSDTNCENVCHNEGFPGGDCRGFRRRCFCTRNC', 'RGKRWWRRKK', 'GLKDIFKAGLGSLVKNIAAHVAN', 'FLPAIVGAAGKFLPKIFCAISKKC', 'QPFSLERW', 'GLMSTLKGAATNVAVTLLNKLQCKLTGTC', 'RWKLFKKIEKVGRNVRDGLIKAGPAIAVIGQAKSL', 'ITSHSLCTPGCAKTGSFNSFCC', 'SHQDCYEALHKCMASHSKPFSCSMKFHMCLQQQ', 'LRDLVCYCRKRGCKGRERMNGTCRKGHLLYTMCCR', 'QLINSPVTCMSYGGSCQRSCNGGFRLGGHCGHPKIRCCRRK', 'GLAGAISSALDKLKQSQLIKNYAKKLGYPR', 'RILSILRHQNLLKELQDLALQGAK', 'AVNIPFKVKFRCKAAFC', 'GLWNSIKIAGKKLFVNVLDKIRCKVAGGCKTSPDVEYHK', 'RLSRIVVIRVCR', 'LRDLVCYCRARGCKGRERMNGTCSKGHLLYMLCC', 'TVYTNA', 'ILGPVIKTIGGVIGGLLKNL', 'ATCDILSFQSQWVTPNHAGCALHCVIKGYKGGQCKITVCHCRR', 'GIGAAILSAGKSIIKGLANGLAEHF', 'GFSSIFRGVAKFASKGLGKDLARLGVNLVACKISKQC', 'GLLSGLKKVGKHVAKNVAVSLMDSLKCKISGDC', 'EFKRCWKGQGACQTYCTRQETYMHLCPDASLCCLSYALKPPPVPKHEYE', 'LIGSLFRGAKAIFRGARQGWRSHKAVSRYRARYVRRPVIYYHRVYP', 'QDRPKKPGLCPPRPQKPCVKECKNDWSCPGQQKCCNYGCIDECRDPIFVN', 'GFMDTAKNVAKNVAATLLDKLKCKITGGC', 'IFGAILPLALGALKNLIK', 'ILGAILPLVSGLLSNKL', 'SVFAFQDESTSTIAQARLFI', 'GICACRRRFCLNFEQFSGYCRVNGARYVRCCSRR', 'ANKCIIDCMKVKTTCGDECKGAGFKTGGCALPPDIMKCCHNC', 'KLLKWLLK', 'EKYTEAPEYI', 'QAFKTFTPDWNKIRNDAKRMQDNLEQMKKRFNLNL', 'GLFSVLGSVAKHLLPHVVPVIAEKL', 'KWKSFINKLTSKFLHSAKKF', 'INLKAIAALAKKLLG', 'INWKKIFESVKNLV', 'LLGDFFRKAREKIGEEFKRIVQRIKDFLRNLVPRTES', 'FLSGIVGMLGKLFGK', 'FVPYNPPRPGQSKPFPSFPGHGPFNPKIQWPYPLPNPGH', 'GIPCGESCVYIPCLTSAIGCSCKSKVCYRN', 'GFWGSLWEGVKSVV', 'ARIQESTNDILKPITCNTNADCAKFCKGPIHNCVYHTCQCVPGNPHCC', 'KLLKWLKKLLK', 'GLLGGLLGPLLGGGGGGGGGLL', 'GNNRPVYIPQPRPPHPRI', 'KSCCRSTLGRNCYNLCRVRGAQKLCANACRCKLTSGLKCPSSFPK', 'GVIAAAKKVVNVLKNLF', 'ESEFDRQEYEECKRQCMQLETSGQMRRCVSQCDKRFEEDIDWSKYDNQE', 'ANCSCSTASDYCPILTFCTTGTACSYTPTGCGTGWVYCACNGNFY', 'QYGRRCCNWGPGRRYCKRWC', 'GIVDFAKGVLGKIKNVLGI', 'RRCICTTRTCRFPYRRLGTCIFQNRVYTFCC', 'GIFLDKLKNFAKGVAQSLLNKASCKLSGQC', 'RRWKIVVIRWRR', 'KTHYPTNAWKSLWKGFWESLRYTDGF', 'LFGFLIKLIPSLFGALSNIGRNRNQ', 'FFSLIPSLIGGLVFAIK', 'EQPGGDKVNLGYFTN', 'FLSLIPHAINAVSALVHHF', 'LFGLIPSMMGGLVSAFK', 'YVSCLFRGARCRVYSGRSCCFGYYCRRDFPGSIFGTCSRRNF', 'QRFIHPTYRPPPQPRRPVIMRA', 'GGYYCPFFQDKCHRHCRSFGRKAGYCGGFLKKTCICV', 'ATCDLLSGFGVGDSACAAHCIARRNRGGYCNAKTVCVC', 'NWRKILGKIAKVAAGLLGSMLAGYQV', 'EGPVGLADPDGPASAPLGAP', 'VLSHNNESSYSDTSSCTSQ', 'FKCRRWQWR', 'NKGCAICSIGAACLVDGPIPDFEIAGATGLFGLWG', 'GWKSVFRKAKKVGKTVGGLALDHYLG', 'FKCARWQWRMKKLGA', 'RNKLAYNMGHYAGKATIFGLAAWALLA', 'SCNCVCGVCCSCSP', 'FLPLIASLAANFVPKIFCKITKKC', 'GLFDIIKKVASVVGLASP', 'LNLKGIFKKVASLLT', 'ALLHHGLNCAKGVLA', 'GLMSVLKGVLKTAGKHIFKNVGGSLLDQAKCKITGQC', 'GYGCPFNQYQCHSHCRGIRGYKGGYCTGRFKQTCKCY', 'FTMKKSLLFIFFLGTISLSLC', 'LLDVLLE', 'FLPLLAGVVANFLPQIICKIARKC', 'RTCESQSHRFHGTCVRESNCASVCQTEGFIGGNCRAFRRRCFCTRNC', 'GLGSILGKILNVAGKVGKTIGKVADAVGNKE', 'ESGINLQGDATLANN', 'QLKKCWNNYVQGHCRKICRVNEVPEALCENGRYCCLNIKELEAC', 'FFPLIAGLAANFLPQILCKIARKC', 'RYCPRNPEACYNYCLRTGRPGGYCGGRSRITCFCFR', 'SIITMTREAKLPQLWKQIACRLYNTC', 'SGRGKTGGKARAKAKTRSSRAGLQFPVGRVHRLLR', 'GLLSSLSSVA', 'GILSTIKDFAIKAGKGAAKGLLEMASCKLSGQC', 'RDCESDSHKFHGACFSDTNCANVCQTEGFTAGKCVGVQRHCHCTKDC', 'DCTRWIIGINGRICRD', 'GAPICGESCFTGKCYTVQCSCSWPVCTRN', 'ALWKTLLKKVGKVAGKAVLNAVTNMANQNEQ', 'GIINMLQKSYCKIRKGRCALLGCLPKEEQIGSCSVSGRKCCRKKK', 'APRWKFGKRLEKLGRNVFRAAKKALPVIAGYKAL', 'HFLGKLVNLAKKIL', 'SVLGTVKDLLIGAGKSAAQSVLTTLSCKLSNSC', 'GWLRKAAKSVGKFYYKHKYYIKAAWKIGRHAL', 'SAVGRHGRRFGLRKHRKH', 'SISCGESCAMISFCFTEVIGCSCKNKVCYLN', 'ALWKDVLKKIGTVALHAGKAALGAVADTISQ', 'FWATLAKGALKLIPTIANAFSSKS', 'FLFSLIPHAISGLISAFK', 'RVCESQSHGFKGACTGDHNCALVCRNEGFSGGNCRGFRRRCFCTLKC', 'DLPECCSATELELDSGKQTS', 'TSRCYIGYRRKVVCS', 'KIKWFKTMKSIAKFIAKEQMKKHLGGE', 'RQRDPQQQYEQCQKHCQRRETEPRHMQTCQQRCERRYEKEKRKQQ', 'GSRYLCTPGSCWKLVCFTTTVK', 'KWLLKWL', 'GVVTDLLNTAGGLLGNLVGSLSG', 'SIGTAVKKAVPIAKKVGKVAIPIAKAVLSVVGQLVG', 'GLLNTFKDWAISIAKGAGKGVLTTLSCKLDKSC', 'QGVRNRLSCHRNKGVCVPSRCPRHMRQIGTCRGPPVKCCRKK', 'SALVGCWTKSWPPKPCFGRG', 'LDTIKCLQGNNNCHIQKCPWFLLQVSTCYKGKGRCCQKRRWFARSHVYHV', 'FLPVILPVIGKLLNGIL', 'GWLKKLGKRIERIGQHTRDATIQGLGIAQQAANVAATAR', 'KNLRRIIRKIIHIIKKYG', 'ALRLAIRKR', 'SFPFFPPGICKRLKRC', 'QTCASRCPRPCNAGLCCSIYGYCGSGNAYCGAGNCRCQCRG', 'KKLLKWLLKLL', 'KINWGSVGGSCVGGAVIGGALGGLGGAGGGCLTGAIGSIWDQW', 'SLLGTVKDLLIGAGKSAAQSVLKGLSGKLSKDC', 'GLFSKFNKKKIKSGLIKIIKTAGKEAGLEALRTGIDVIGCKIKGEC', 'CPAIQRCCQQLRNIQPPCRCCQ', 'RVKRFWPLVPVAINTVAAGINLYKAIRRK', 'GLNTLKKVFQGLHEAIKLINNHVQ', 'KWKLFKKAVLKVLTT', 'KKKSGVIPTVSHDCHMNSFQFVFTCCS', 'FDNPFGCPADEGKCFDHCNNKAYDIGYCGGSYRATCVCYRK', 'MTPFWRGVSLRPIGASCRDDSECITRLCKKRRCSLSVAQE', 'RLKELITTGGQKIGEKIRRIGQRIKDFFKNLQPREEKS', 'GLLSGILGAGKNIVCGLSGLC', 'GLLNGLALRLGKRALKKIIKRLCR', 'GIGTKIIGGLKTAVKGALKELASTYVN', 'GLFRRLRDSIRRGQQKILEKARRIGERIKDIFRG', 'ATKVKAKQRGKEKVSSGRPGQHN', 'GLWKSLLKNVGKAAGKAALNAVTDMVNQA', 'GIFSKLAGKKLKNLLISGLKSVGKEVGMDVVRTGIDIAGCKIKGEC', 'WNDTGKDADGAEY', 'FKTWKRPPFQTSCSGIIKE', 'KWKSFIKKLASKFLHSAKKF', 'GLFDVIKKVASVIGLASP', 'RISFKKGKGSWIKNGLIKGIKGLGKEISLDVIRTGIDIAGCKIKGEC', 'RLSRIVVIRVSR', 'GWLRKLGKKIERIGQHTRDASIQVLGIAQQAANVAATAR', 'GNGVLKTISHECNMNTWQFLFTCC', 'GIMRVFKGVLKTAGKSVAKNVAGSFLDRLKCKISGGC', 'FLPLLAGLAANFLPKIFCKITKKC', 'GKIPVKAIKKAGAAIGKGLRAINIASTAHDVYSFFKPKHKKK', 'LPVNEAQCRQVGGYCGLRICNFPSRFLGLCTRNHPCCSRVWV', 'DKLIGSCVWGAVNYTSRCNAECKRRGYKGGHCGSFANVNCWCET', 'KGIGSALKKGGKIIKGGLGALGAIGTGQQVYEHVQNRQ', 'KKCRERGGQCHSGVCSWNEKFIGFCSFARPCC', 'ILGKILKGIKKLF', 'INLLKIAKGIIKSL', 'INWKKIFEKVKDLV', 'DYHHGVRVL', 'RIKRFWPVVIRTVVAGY', 'GIGALSAKGALKGLAKGLAEHFAN', 'VFIDILDKMENAIHKAAQAGIGLAKPIENMILPK', 'KWLKKLLKKLL', 'GIFGKILGVGKKVLCGLSGVC', 'YPASMDNYDDALEELDNLDLDDYFDLEPADFVLLDMWANMLESSDFDDME', 'KRKKHRCRVYNNGMPTGMYRWC', 'SVMGTVKDLLIGAGKSAAQSVLKSLSCKLSNDC', 'IDWKKIFEKVKNLV', 'GLLKPLLKIAAKVGSNLL', 'ADDRNPLEECFRETDYEEFLEIARNGLKKT', 'ILSAIWSGIKS', 'FLPPSPWKETFRTT', 'GGLKKFGKKLEGVGKRVFKASEKALPVVTGFKAL', 'FLGLIFHGLVHAGKLIHGLIHRNRG', 'GLLDFAKHVIGIASKLG', 'KVFLGLK', 'FLPKLFAKITKKNMAHIR', 'ILSAIWSGIKGLL', 'GMSGYIQGIPDFLKGYLHGISAANKHKKGRL', 'ILGKILEGIKSLF', 'GIFTKINKKKAKTGVFNIIKTIGKEAGMDVIRAGIDTISCKIKGEC', 'GLFSKFAGKGIKDLIFKGVKHIGKEVGMDVIRVGIDVAGCKIKGVC', 'RGGRLCYCRPRFCVCVGR', 'VRPYLVAF', 'KVPIGAIKKGGKIIKKGLGVIGAAGTAHEVYSHVKNRQ', 'ALLLAIRKR', 'GIMDTVKNAAKDLAGQLLDKLKCRITGC', 'RGLRRLGRKIAHGVKKYGPTVLRIIRIAG', 'RLKLLLLRLK', 'FLSLIPTAINAVSALAKHF', 'GSPIQCAETCFIGKCYTEELGCTCTAFLCMKN', 'LTVRAAQSFGRCNQKQCDADCVKKGYFGGLCTLTSCFCTGSRS', 'KPWERE', 'GGLKKLGKKLEGAGKRVFKASEKALPVVVGIKAIGK', 'GIGCGESCVWIPCVSAAIGCSCSNKICYRN', 'GILGNIVGMGKKIVCGLSGLC', 'FLGGLMKAFPALICAVTKKC', 'LALKSGGWLRLFGLKDKKH', 'FFGHLFRGIINVGKHIHGLLSG', 'FINLLDKVEDALHTGAQAGFKLIRPVERGATPKKSEKPEK', 'GIGSAILSAGKSALKGLAKGLAEHFAN', 'GSEIQPR', 'ILGPVIGTIGNVLGGLLKNL', 'GKIPVKAIKKGGQIIGKALRGINIASTAHDIISQFKPKKKKNH', 'FPMKKSLLLIFFLGTINLSFCEEERNAEEEKRDGDDEMDVEVQKR', 'FDITKLNIKKLTKATCKVISKGASMCKVLFDKKKQE', 'GIMDTVKNAAKDLAGQLDKLKCRITGC', 'GIFSKISGKAIKNLFIKGAKNVGKEVGIDVVRTGMDVVGCKIKGEC', 'INWKGIAAMAKKLL', 'GLISGILGVGKMLVCGLSGLC', 'GIGASILSAGKSALKGLAKGLAEHFAN', 'GVIPCGESCVFIPCISAAIGCSCKNKVCYRN', 'YVPLPNVPQPGRRPFPTFPGQGPFNPKIKWPQGY', 'ALWKTLLKGAGKVFGHVAKQFLGSQGQPES', 'YPASYDDDFDALDDLDDLDLDDLLDLEPADLVLLDMWANMLDSQDFEDFE', 'RRWVIWRR', 'GFMDTAKQVAKNVAVTLIDKLRCKVTGGC', 'GLFGILGSVAKHVLPHVVPVIAEHS', 'QYRHRCCAWGPGRKYCKRWC', 'SRDLICYCRKGGCNRGEQVYGTCSGRLLYCCPRR', 'NLCERASLTWTGNCGNTGHCDTQCRNWESAKHGACHKRGNWKCFCYFNC', 'SIITMTKEAKLPQLWKQIACRLYNTC', 'RECQSQSHRYKGACVHDTNCASVCQTEGFSGGKCVGFRGRCFCTKHC', 'RRWCFRVCYKGFCYRKCR', 'LKWLKKWLK', 'AHDGNPLEECFREDDEEFFLEIAKNGLTATSNPKRVVIV', 'FFSMIPKIATGIASLVKNL', 'HICHDYLEGDHCDPKDCNLDCRDKWKGTGTCEPPTGTPLTRTCYCTYDC', 'QCRRLCYKQRCVTYCRGR', 'DERCTIIIHPGSPCDPSDCVQYCYAEYNGVGKCIASKPGRSANCMCTYNC', 'GLVSGLLNTAGGLLGDLLGSLGSLSG', 'FLSLIPHAINAISAIANHF', 'KSTCKAESNTFPGLCITKPPCRKACLSEKFTDGKCSKILRRCICYKPC', 'LRDLVCYCRKRGCKRREHMNGTCRKGHLMYTLCCR', 'FLIIRRPIVLGLL', 'ILFSYLLFYVLKENSKREDKYQNIIEELTELLPKIKEDVEDIKEKLNK', 'RCTCTTIISSSSTF', 'RRLCRIVWVIRVCRR', 'GICRCICTRGFCRCICVL', 'GSNKGFNFMVDMINALSN', 'WLGSALKIGAKLLPSVVGLFQKKKK', 'KKKKQSWYAAAGDAIVSFGEGFLNAW', 'DLVCYCRARGCKGRERMNGTCRKGHLLYMLCCR', 'GLLSFLPKVIGVIGHLIHPPS', 'ATNIPFKVHFRCKAAFC', 'TTPVCAVAATAAASSAACGWVGGGIFTGVTVVVSLKHC', 'KNLRRITRKIIHIIKKYG', 'FLGSLLGLVGKIVPTLICKISKKC', 'DNGEAGRAAR', 'RVCYAIPLPICY', 'YQWQRRMRKL', 'VSGNVAARKGKQQTSSGKGGGTN', 'GNGVIKTISHECHMNTWQFIFTCCS', 'VTCDLLSFEAKGFAANHSICAAHCLVIGRKGGACQNGVCVCRN', 'IWNKIAKSIGKVLEKAL', 'GLVDVLGKVGGLIKKLLP', 'GFMNTAKNVAKNVAVTLLDNLKCKITGGC', 'SMLSVLKNLGKVGLGLVACKINKQC', 'FNRGGYNFGKSVRHVVDAIGSVAGIRGILKSIR', 'KWKSFIKKSTSKFLHSAKKF', 'LLGRCKVKSNRFNGPCLTDTHCSTVCRGEGYKGGDCHGLRRRCMCLC', 'DLDVNVFNR', 'RLARIVVIRWAR', 'IFGAIAGLLKNIF', 'KWKSFIKKLTSAAKKVVTTAKPLISS', 'RWKIFKKIEKMGRNIRDGIVKAGPAIEVLGSAKAI', 'FLPVIAGLAAKVLPKLFCAITKKC', 'TSYGNGVHCNKSKCWIDVSELETYKAGTVSNPKDILW', 'GLVASIGRALGGLLADVVKSKEQPA', 'FLPLLASLFSRLF', 'GIFDKLKNFAKGVAQSLLNKASCKLSGQC', 'RLKRMTPFWRGVSLRPVGASCRDNSECITMLCRKNRCFLRTASE', 'FLENQDCSKHRHCRMKCKANEYAVRYCEDWTICCRVKKKESKKKKMW', 'GKLQAFLAKMKEIAAQTL', 'FLPFFASLLGKLL', 'GCTQWINNIHGRICVRN', 'DCKHPVGPYTDSCFTDCVSGKYGYNYESAFCSRDETGTCKICCCELINE', 'GIFTLIKGAAKLIGKTVAKEAGKTGLELMACKITNQC', 'ACQCPDAISGWTHTDYQCHGLENKMYRHVYAICMNGTQVYCRTEWGSSC', 'GRCVCRKQLLCSYRERRIGDCKIRGVRFPFCCPR', 'VTCDILSVEAKGVKLNDAACAAHCLFRGRSGGYCNGKRVCVCR', 'GLLDSLKGFAATAGKGVLQSLLSTASCKLAKTC', 'LKWLKKLLKKL', 'GLVDVLGKVGGLIKKLLPG', 'WLRRIGKGVKIIGGAALDHL', 'RYHMQCGYRGTFCTPGKCPHGNAYLGLCRPKYSCCRWL', 'ITSISLCTPGCKTGVLMGCNLKTATCNCSVHVSK', 'MLMACYSAGQLGCLVFCNEAEYSYGKCIGRGRCCCYDL', 'GWLKKIGKKIERVGQHTRDATIQTIAVAQQAANVAATAR', 'LRDLVCYCRTRGCKRRERMNGTCRKGHLIYTLCC', 'GLWSNIKTAGKEAAKAALKAAGKAALGAVTDAV', 'GRLKKLGKKIEGAGKRVFKAAEKALPVVAGVKALG', 'VDKGSYLPRPTPPRPIYNRN', 'QQCGRQAGNRRCANNLCCSQYGYCGRTNEYCCTSQGCQSQCRRCG', 'GVWSTVLGGLKKFAKGGLEAIVNPK', 'GLLDTFKNLALNAPKSAGVSVLNSLSCKLSKTC', 'KQFRIRVRVIRK', 'KWCFRVCYRGICYRKCR', 'GLWDSIKIAGKKLFVNVLDKIRCKVAGGC', 'VAIALKAAHYHTHKE', 'GIINTLQKYYCRVRGGRCAVLTCLPKEEQIGKCSTRGRKCCRRKK', 'LIGPVLGLVGSALGGLLKKI', 'SGKLYYRRKK', 'EPILGIITSLLKSL', 'ACHAHCQSVGRRGGYCGNFRMTCYCY', 'AIHRALISKRMEGHCEAECLTFEVKIGGCRAELAPFCCKNRKKH', 'AWLLAIRKR', 'GMATKAGTALGKVAKAVIGAAL', 'ILGPVLGLVSNALGGLLKNL', 'KNGYGGSGNRWVHCGAGIVGGALIGAIGGPWSAVAGGISGGFASCH', 'HKTDSFVGLM', 'ALWLAIRKR', 'QGVRSYLSCWGNRGICLLNRCPGRMRQIGTCLAPRVKCCR', 'NFLDTLINLAKKFI', 'QLEARFEPKQRNFRKRELDFEKLFANMPDY', 'RRARIVVIRVAR', 'LLGNFFRKAREKIGKEFKRIVQRIKDFLQHLVPRTEA', 'GVVDILKGAAKDLAGHLASKVMNKI', 'GWMSKIASGIGTFLSGVQQG', 'RLGDILQKAREKIEGGLKKLVQKIKDFFGKFAPRTES', 'GLISGILGVGKKLVCGLSGLC', 'GVLDAFKKIATVVKNLV', 'TTKNYGNGVCNSVNWCQCGNVWASCNLATGCAAWLCKLA', 'SLWETIKNAGKGFIQNLDKIR', 'KYYGNGVTCGKHSCSVNWGQAFSCSVSHLANFGHGKC']\n" ] } ], "source": [ "neg_seq = []\n", "neg_id= []\n", "\n", "for seq_record in SeqIO.parse(\"/content/drive/MyDrive/Briefings in Bioinformatics/Sequence/Sequence2/neg_train_main.fasta\", \"fasta\"):\n", " neg_seq.append(str(seq_record.seq))\n", " neg_id.append(str(seq_record.id))\n", "pos_seq = []\n", "pos_id= []\n", "\n", "for seq_record in SeqIO.parse(\"/content/drive/MyDrive/Briefings in Bioinformatics/Sequence/Sequence2/pos_train_main.fasta\", \"fasta\"):\n", " pos_seq.append(str(seq_record.seq))\n", " pos_id.append(str(seq_record.id))\n", "seqs=pos_seq + neg_seq\n", "dfclass = pd.DataFrame({'class' : np.repeat((1,0), (689, 689))})\n", "y=dfclass['class']\n", "print(seqs)" ] }, { "cell_type": "code", "execution_count": 5, "metadata": { "id": "TS7_OTBCTHXe", "colab": { "base_uri": "https://localhost:8080/" }, "outputId": "28a6bd61-79ee-4b56-bd25-bcdb01ceaa69" }, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "['FLWWLFKWAWK', 'FAKLAKKALAKLL', 'GLFDIVKKIAGHIAGSI', 'VNFKKLLGKLLKVVK', 'WKKIPKFLHLLKKF', 'EQCGRQAGGKLCPNNLCCSQYGWCGSSDDYCSPSKNCQSNCKGGG', 'EADEPLWLYKGDNIERAPTTADHPILPSIIDDVKLDPNRRYA', 'FVGLAKVAAHVVPAIAEHF', 'FAKLLAKLAKKFAL', 'ARSYGNGVYCNNKKCWVNRGEATQSIIGGMISGWASGLAGM', 'KWKLFKKIGIGAFLHSAKKF', 'GIGKFLHSAKKWGKAFVGQIMNC', 'PAWRKAFRWAWRMLKKAA', 'FAKLLAKALKKLL', 'AIGKFLHSAKKFGKAFVGEIMNS', 'KRFKQDGGWSHWSPWSSC', 'FLPIALKALGSIFPKIL', 'TESYFVFSVGM', 'CLGIGSCNDFAGCGYAVVCFW', 'GMWSKILGHLIK', 'GFGALFKFLAKKVAKTVAKQAAKQGAKYVVNKQME', 'GMWSKILGHLKR', 'FKCRRWQWRMKKLGAPSITCVR', 'KWKLFKKIGIGAFLHLAKKF', 'CGESCVWIPCISAAIGCSCKNKVCYRAIP', 'KWKSFAKTFKSAKKTVAHTALKAISS', 'KSCCPNTTGRNIYNTCRFGGGSREVCARISGCKIISASTCPSDYPK', 'GKFMSLLKHILK', 'FAKKLKKLAKKL', 'FAKLLAKLAKKSL', 'FLPIIAKVLSGLL', 'ITCPQVTQSLAPCVPYLISG', 'FAKLLAKLAKKIL', 'FAKKLAKKLAKAAL', 'FAKLLAKLAKKAA', 'FLGWLFKWASK', 'GIGAVLKVLTTGLPALISWIKRKRQQ', 'FNRGGYNFGKSVRHVVDAIGSVAGILKSIR', 'GVPCGESCVFIPCITGVIGCSCSSNVCYLN', 'FFPVIGRILNGIL', 'KMWSKILGHLIR', 'FALALKALKKLKKALKKAL', 'FLGALFKALSKLL', 'FFPNVASVPGQVLLKKIFCAISKKC', 'GEYCGESCYLIPCFTPGCYCVSRQCVNKN', 'FLSLIPHIVSGVAALAKHL', 'SQETFSDLWKLLPEN', 'WHSDMEWWYLLG', 'FAEPLPSEEEGESYSKEPPEMEKRYGGFM', 'PAWRKAFRWAARMLKKAA', 'VNWKKILGKIIKVAK', 'GLFDIVKKIAGHIASSI', 'WFKKIPKFLHLLKKF', 'GIIKKIIKKIIKKI', 'KWKSFLKTFKSLKKTVLHTALKAISS', 'FAKKLAKALL', 'FLGWLFKWAKK', 'ACYCRIPACLAGERRYGTCFYRRRVWAFCC', 'FALAKALKKAL', 'GKWKKILGKLIR', 'LALMLPGC', 'FALALKALKKA', 'FLKLLKKLAAKLF', 'DILTFEHYWAQLTS', 'VAKFLAKFLKKAL', 'FRGLAKLLKIGLKSFARVLKKVLPKAAKAGKALAKSMADENAIRQQNQ', 'VNWKKVLGKVVKVVK', 'MWKWFHNVLSWWWLLADKRPARDYNRK', 'GSEGPLKPGARIFSFDGKDVLRHPT', 'LLGMIPLAISAISALSKL', 'FLPVIAGVAAKFLPKIFCAITKKC', 'ILGPVISTIGGVLGGLLKNL', 'FWGALAKGALKLIPSLFSSFSKKD', 'GIGVLLSAGKAALKGLAKVLAEKYAN', 'LGFWGLPH', 'RRRRRRRRGNLWAAQRYGRELRRMSDEFVDSFKK', 'LVRGCWTKSYPPKPCFVR', 'GLFKVIKKVASVIGGL', 'FLSHIAGFLSNLF', 'FLGAIAAALPHVINAVTNAL', 'FALALKALKKAL', 'FAKKLAKKAKLAKKL', 'CSCRTSSCRFGERLSGACRLNGRIYRLCC', 'FAKKLAKKLL', 'GLLGLLGSVVSHVVPAIVGHF', 'FVDLKKIANIINSIFKK', 'FLIGMTHGLICLISRKC', 'KAAKKAAKAAKKAAKAAKKAA', 'GLPVCGETCFGGTCNTPGCACDPWPVCTRD', 'GLFDIVKKVVGTLAGL', 'GRRKRKWLRRIGKGVKIIGGAALDHL', 'KLAKLAKKLAKLAK', 'PNEVNRLAHLRLH', 'GLFGVLGSIAKHVLPHVVPVIAEK', 'GLPICGETCVGGSCNTPGCSCSWPVCTRN', 'PDEDAINNALNKVCSTGRRQRSICKQLLKK', 'GLFKVLGSVAKHLLPHVVPVIAEK', 'GLFDIIKKVASVIGGL', 'KAAKKWAKAAKKAAKAWKKAA', 'GSLCGDTCFVLGCNDSSCSCNYPICVKD', 'KWKLF', 'YKQCHKKGGHCFPKEKICLPPSSDFGKMDCRWRWKCCKKGSG', 'GLPTCGETCFGGTCNTPGCTCDPWPVCTHN', 'AIPCGESCVWIPCISTVIGCSCSNKVCYR', 'FLSLALAALPKFLCLVFKKC', 'PAWRKARRWAWRMKKLAA', 'FLPGLIAGIAKML', 'KAKLAKKALAKLL', 'GGLRSLGRKILRAWKKYGPIIVPIIRIG', 'PRFWEYWLALME', 'FLPVIAGLLSKLF', 'GLFDVIKAVASVIGGL', 'FFGSVLKVAAKVLPAALCQIFKKC', 'FAKLLAKLAKKAL', 'FLKLLKKLAAKFLPTIICKISYKC', 'YCAYYSPRHKTTF', 'HHPHGHHPHGHHPHGHHPHG', 'GACFSIAHECGA', 'VRRFPWWWPFLRR', 'FLPILINLIHKGLL', 'FLSIIAKVLGSLF', 'FFSASCVPGADKGQFPNLCRLCAGTGENKCA', 'FIHHIIGGLFSAGKAIHRLIRRRRR', 'PPKSQ', 'KKKFPWWWPFKKKCKKKFPWWWPFKKKC', 'VAKKFAKKFKKFAKKFAKFAFAF', 'GLLSVLGSVVKHVIPHVVPVIAEHL', 'FGKGIGKVGKKLL', 'AWKLFDDGV', 'PEWFKCRRWQWRMKKLGA', 'YERDPRQQYEQCQRRCESEATEEREQEQCEQRCEREYKEQQRQQEEE', 'FALALKALKK', 'GLFDVIAKVASVIKKL', 'CAHNLTHAC', 'GIGKFLKKAKKGIGAVLKVLTTGL', 'ATCKAECPTWDSVCINKKPCVACCKKAKFSDGHCSKILRRCLCTKEC', 'PAWRKAARWAWRMLKKAA', 'GIGTKILGGVKTALKGALKELASTYAN', 'CIKNGNGCQPNGSQNGCCSGYCHKQPGWVAGYCRRK', 'FALALKALKKALKKLKKALKKAL', 'FLSLLPSIVSGAVSLAKKL', 'ACYCRIGACVSGERLTGACGLNGRIYRLCCR', 'ATCDLLSMWNVNHSACAAHCLLLGKSGGRCNDDAVCVCRK', 'FLPVIAGVAANFLPKLFCAISKKC', 'GFLDTFKNLALNAAKSAGVSVLNSLSCKLFKTC', 'QSHLSLCRWCCNCCRSNKGC', 'ALWKNMLKGIGKLAGKAALGAVKKLVGAES', 'KWKLFKKIGIGKFLHLAKKF', 'FDIVKKIAGHIAGSI', 'CSTNTFSLSDYWGNKGNWCTATHECMSWCK', 'KSCCKNTTGRNIYNTCRFAGGSRERCAKLSGCKIISASTCPSYPDK', 'FFHHIFRGIVHVGKTIHRLVTG', 'AISYGNGVYCNKEKCWVNKAENKQAITGIVIGGWASSLAGMGH', 'ETCASRCPRPCNAGLCCSIYGYCGSGAAYCGAGNCRCQCRG', 'GFRDVLKGAAKAFVKTVAGHIANI', 'LGGIVSAVKKIVDFLG', 'GIIKKIIIKKIIIKKIIIKKI', 'GIGKFLHSAKKFAKAFVAEIMNS', 'FALA', 'KNWKKILKKIIKVVK', 'KILRGVCKKIMRTFLRRISKDILTGKK', 'SPLGYGFAVRNSG', 'GLFGKLIKKFARKAISYAVKKARGKH', 'ANTAFVSSAHNTQKIPAGAPFNRNLRAMLADLRQNAAFAG', 'PDEDAINDALNKVCSTGRRQRSICKQLLKK', 'FAFGKGIGKVGKKLL', 'FAKKLLAKALKL', 'CHANLTHAC', 'FKSWSFCTPGCAKTGSFNSYCC', 'FKRLAKIKVLRLAKIKR', 'FLPLILRKIVTAL', 'ATCDLLSAFGVGHAACAAHCIGHGYRGGYCNSKAVCTCRR', 'LLKELWTKIKGAGKAVLGKIKGLL', 'DWTFANWSCLVCDDCSVNLTV', 'GIPCGESCVWIPCISAALGCSCKNKVCYRN', 'GLIGSIGKALGGLLVDVLKPKL', 'VLPLISMALGKLL', 'FISAIASMLGKFL', 'SAISCGETCFKFKCYTPRCSCSYPVCK', 'INWKKIASIGKEVLK', 'DSHAKRHHGYKRKFHEKHHSHRGY', 'IFGSLFSLGSKLLPTVFKLFSRKKQ', 'MNNTIKDFDLDLKTNKKDTATPYVGSRYLCTPGSCWKLVCFTTTVK', 'CLGVGSCNDFAGCGYAIVCFW', 'GVLGTVKDLLIGAGKSAAQSTLKTLSCKISNDC', 'EKYTEVPEYI', 'VKCAVKDTYSCFIVRGKCRHECHDFEKPIGFCTKLNANCYM', 'APKGVQGPNG', 'PAQPFRIKKRQGPFERP', 'GTVPCGESCVFIPCITGIAGCSCKNKVCYIN', 'RCVCTRGFCRCVCTRGFC', 'AQCGAQGGGATCPGGLCCSQWGWCGSTPKYCGAGCQSNCR', 'GLMSTLKDFGKTAAKEIAQSLLSTASCKLAKTC', 'GLWNSIKIAGKKLFVNVLDKIRCKVAGGC', 'KTCENLSGTFKGPCIPDGNCNKHCRNNEHLLSGRCRDDFRCWCTNRC', 'GLFTKFAGKGIKDLIFKGVKHIGKEVGMDVIRVGIDVAGCKIKGVC', 'GFLGPLLKLGLKGAAKLLPQLLPSRQQ', 'KNLRRIIRKGIHIIKKYG', 'ATCDLLSGFGVGDSACAAHCIARGNRGGYCNSKKVCVCRN', 'RWKFFKKIEKVGQNIRDGIIKAGPAVAVVGQAASIT', 'SLNVMRKGIRKQPVSSGKRGGVNDYDM', 'RLCPRVRIRVCR', 'SVFAFENEQSSTIAPARLYK', 'LLKKLLKWLKK', 'AVNIPFKVHFRCKAAFC', 'GRSKKLGKKIEKAGKRVFNAAQKGLPVAAGVQAL', 'SIGFDGLNDPDIVAR', 'CAETCVVLPCFIVPGCSCKSSVCYFN', 'GVGDIFRKIVSTIKNVV', 'GIPCAESCVWIPCTVTALLGCSCSNNVCYN', 'GLLDSLKNLAINAAKGAGQSVLNTLSCKLSKTC', 'CLGIGSCNNFAGCGYAVVCFW', 'GLLDTLKNMAINAAKGAGQSVLNTLSCKLSKTC', 'ILSAIWSGIKSLF', 'YAFGYPS', 'VTCFCRRRGCASRERLIGYCRFGNTIYGLCCRR', 'RRCICTTRTCRFPYRRLGTCLFQNRVYTFCC', 'LRDLVCYCRTRGCKRREHMNGTCRKGHLMYTLCCR', 'KCWNLRGSCREKCIKNEKLYIFCTSGKLCCLKPKFQPNMLQR', 'HFLGTLVNLAKKIL', 'DKLIGSCVWGAVNYTSNCNAECKRRGYKGGHCGSFANVNCWCER', 'WNPFKELERAGQRVRDAVISAAAVATVGQAAAIARGG', 'GKNGVFKTISHECHLNTWAFLATCCS', 'YCNRRTGKCQRM', 'LE', 'GLFPKFNKKKVKTGIFDIIKTVGKEAGMDVLRTGIDVIGCKIKGEC', 'VFIDILDKMENAIHKAAQAGIGIAKPIEKMILPK', 'GLWDSIKNFGKTIALNVMDKIKCKIGGGCPP', 'FLPILASLAAKLGPKLFCLVTKKC', 'FFPIVGKLLFGLSGLL', 'RDWERREFERRQNELRREQEQRREELL', 'GLLDTLKNMAINAAKDAGVSVLNTLSCKLSKTC', 'HRHQGPIFDTRPSPFNPNQPRPGPIY', 'MWGRILAFVAKYGTKAVQWAWKNKWFLLSLGEAVFDYIRSIWGG', 'ILGPVLGLVGNALGGLIKKI', 'GCLEFWWKCNPNDDKCCRPKLKCSKLFKLCNFSF', 'QLGDVLQKAGEKIVRGLKNIGQRIKDFFGKLTPRTES', 'ASGWVCTLTIECGTLVCAC', 'LIKIVPAMICAVTKKC', 'LLEL', 'GIPCGESCVFIPCITSVAGCSCKSKVCYRN', 'LLKWLKKWLKK', 'KYYGNGVHCGKKTCYVDWGQATASIGKIIVNGWTQHGPWAHR', 'VFQFLGRIIHHVGNFVHGFSHVF', 'RRSRKNGIGYAIGYAFGAVERAVLGGSRDYNK', 'GLLDAIKDTAQNLFANVLDKIKCKFTKC', 'GLGSFLKNAIKIAGKVGSTIGKVADAIGNKE', 'KTCEHLADTYRGVCFTNASCDDHCKNKAHLISGTCHNWKCFCTQNC', 'FLGGLIKIVPAMICAVTKK', 'VCSCRLVFCRRTELRVGNCLIGGVSFTYCCTRVD', 'GTACGESCYVLPCFTVGCTCTSSQCFKN', 'GKKLFVNVLDKIRCKVAGGC', 'GIFSLIKGAAKLITKTVAKEAGKTGLELMACKVTNQC', 'VIPFVASVAAEMMPHVYCAASRKC', 'RYCERSSGTWSGVCGNTDKCSSQCQRLEGAAHGSCNYVFPAHKCICYYPC', 'GLLLDTLKGAAKDIAGIALEKLKCKITGCKP', 'ILKKWPWWPWRRK', 'RIITCSCRTFCFLGERISGRCYQSVFIYRLCCRG', 'INWKKIASIGKEVL', 'GLLSRLRDFLSDRGRRLGEKIERIGQKIKDLSEFFQS', 'KSYGNGVQCNKKKCWVDWGSAISTIGNNSAANWATGGAAGWKS', 'GLFGRLRDSLQRGGQKILEKAERIWCKIKDIFRG', 'KWKLFKKIGIGAVLKVLT', 'LDEPNMDTISKSREYKCKIDLDCSNHIACRHCSYRNCKCDHGTCKCMP', 'KTCENLADTFRGPCFATSNCDDHCKNKEHLLSGRCRDDFRCWCTRNC', 'ADDKNPLEEAFREADYEVFLEIAKNGL', 'QFTNVSCTTSKECWSVCQRLHNTSRGKCMNKKCRCYS', 'GVLDAFRKIATVVKNVV', 'FDIIKKVASVVG', 'KWKWKW', 'RFIPPILRPPVRPPFRPPFRPPFRPPPIIRFFGG', 'KQQLATEAESAGPIL', 'EFKRCWKGQGACRTYCTRQETYMHLCPDASLCCLSYALKPPPVPKHEYE', 'KGRGKQGGKVRAKAKTRSS', 'FFPIVGKLLSGLF', 'DKLIGSCVWGAVNYTSNCRAECKRRGYKGGHCGSFLNVNCWCET', 'EQCGRQAGGATCPNNLCCSQYGY', 'KWKLFKKIEKVGQGIGAVLKVLTTGL', 'KIKWFKTMKSLAKFLAKEQMKKHLGE', 'ATCRKPSMYFSGACFSDTNCQKACNREDWPNGKCLVGFKCECQRPC', 'GILDIAKKLVGGIRNVLGI', 'WYVKKCLNDVGICKKKCKPEEMHVKNGWAMCGKGRDCCVPAD', 'LLPILGNLLNGLL', 'AGIGKIGDFIKKAIAKYKN', 'GLFSKFSGKGIKNFLIKGVKHIGKEVGMDVIRTGIDVAGCKIKGEC', 'RFPWWWPFLR', 'SYVGDCGSNGGSCVSSYCPYGNRLNYFCPLGRTCCRHAYV', 'GLFSKFAGKGIKNLIFKGVKHIGKEVGMDVIRTGIDVAGCKIKGEC', 'RCYTNDDCKDGQPCPVPLACLFGSCICPWKSQSKLPICQIICANLD', 'ENCGRQAG', 'LDSLSFSYNNFEEDD', 'AVKDTYSCFIMRGKCRHECHDFEKPIGFCTKLNANCYM', 'ANLDAIIKIQAWARMWAARRQYL', 'KFFRKLKKSVKKRAKEFFKKPRVIGVSIPF', 'GSVFNCGETCVLGTCYTPGCTCNTYRVCTKD', 'KLLKKLLKWLK', 'FLPIIAGMAAKVICAITKKC', 'GGLRSLGRKILRAWKKYG', 'SLGSFMKGVGKGLATVGKIVADQFGKLLEA', 'INWLKLGKKMMSAI', 'MKVFFLFAVLFCLVRRNSVHISHQEARGP', 'KAGLAFPVGRVHRLLRK', 'FTIAEPYIHPCMKGFCSFKSECANKCIFMGHHKGGDCIGGLDGIYCCCLA', 'WFRKQLKW', 'LLSLVPHAINAVSAIAKHF', 'YSRCQLQGFNCVVRSYGLPTIPCCRGLTCRSYFPGSTYGRCQRF', 'FLPLLLSALPSFLCLVFKKC', 'GVLDAFRKIATVVKNLV', 'IFGSLFSLGSKLLPSVFKLFSRKKQ', 'GRFRRLRKKTRKRLKKIGKVLKWIPPIVGSIPLGC', 'RRWFWR', 'GLPCGESCVFIPCITTVVGCSCKNKVCYND', 'DYDWSLRGPPKCATYGQKCRTWSPPNCCWNLRCKAFRCRPR', 'GVFTLIKGATQLIGKTLGKEVGKTGLELMACKITKQC', 'EKCLRWQWRMRKYGG', 'ACYCRIPACLAGERRYGTCFYLGRVWAFCC', 'QCMQLETSGQMRRCVSQCDKRFEEDIDWSKYDNQE', 'GPIQISYNYNYGPCGRYCGILGVSPGDNLDCGNQR', 'GLLSGVLGVGKKIVCGLSGLC', 'SPKKTKPVKPKKVA', 'GLWSKIKEAAKTAGLMAMGFVNDMV', 'SGKRWWRRKK', 'QQCGRQASGRLCGNRLCCSQWGYCGSTASYCGAGCQSQCRS', 'GNPKVAHCASQIGRSTAWGAVSGA', 'RWKRWWRRKK', 'SIGSALKKALPVAKKIGKIALPIAKAALP', 'SISCGETCTTFNCWIPNCKCNHHDKVCYWN', 'GGLKKLGKKLEGVGKRVFKASEKALPVLTGYKAIG', 'GYGCPFNQYQCHSHCSGIRGYKGGYCKGTFKQTCKCY', 'DKLIGSCVWGAVNYTRNCNAECKRRGYKGGHCGSFANVNCWCET', 'GLFLDTLKGLAGKLLQGLKCIKAGCKP', 'YSKSLPLSVLNP', 'GLPVCGETCTLGKCYTAGCSCSWPVCYRN', 'MSKLVQAISDAVQAQQNQDWAKLGTSIVGIVENGVGILGKLFGF', 'QVFTLIKGATQLIRKTLGEQ', 'SGKLWWRRKK', 'WKSESLCTPGCVTGALQTCFLQTLTCNCKISK', 'FLGALWNVAKSVF', 'SLSRFLSFLKIVYPPAF', 'FIMDLLGKIF', 'KIPCGESCVWIPCVTSIFNCKCKENKVCYHD', 'DKLIGSCVWLAVNYTSNCNAECKRRGYKGGHCGSFLNVNCWCET', 'FLPILGKLLSGLL', 'SVPTSVYTLGIKILWSAYKHRKTIEKSFNKGFYH']\n" ] } ], "source": [ "Indneg_seq = []\n", "Indneg_id= []\n", "\n", "for Indseq_record in SeqIO.parse(\"/content/drive/MyDrive/Briefings in Bioinformatics/Sequence/Sequence2/neg_test_main.fasta\", \"fasta\"):\n", " Indneg_seq.append(str(Indseq_record.seq))\n", " Indneg_id.append(str(Indseq_record.id))\n", "Indpos_seq = []\n", "Indpos_id= []\n", "\n", "for Indseq_record in SeqIO.parse(\"/content/drive/MyDrive/Briefings in Bioinformatics/Sequence/Sequence2/pos_test_main.fasta\", \"fasta\"):\n", " Indpos_seq.append(str(Indseq_record.seq))\n", " Indpos_id.append(str(Indseq_record.id))\n", "\n", "Indseqs=Indpos_seq + Indneg_seq\n", "Inddfclass = pd.DataFrame({'class' : np.repeat((1,0), (172, 172))})\n", "z=Inddfclass['class']\n", "print(Indseqs)" ] }, { "cell_type": "code", "source": [ "pip install keras-tuner --upgrade\n" ], "metadata": { "id": "cknEu4TtiWc_", "colab": { "base_uri": "https://localhost:8080/" }, "outputId": "d7aee187-0516-48a4-8d12-8c1220d1900c" }, "execution_count": 6, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/\n", "Requirement already satisfied: keras-tuner in /usr/local/lib/python3.7/dist-packages (1.1.2)\n", "Requirement already satisfied: numpy in /usr/local/lib/python3.7/dist-packages (from keras-tuner) (1.21.6)\n", "Requirement already satisfied: ipython in /usr/local/lib/python3.7/dist-packages (from keras-tuner) (5.5.0)\n", "Requirement already satisfied: requests in /usr/local/lib/python3.7/dist-packages (from keras-tuner) (2.23.0)\n", "Requirement already satisfied: packaging in /usr/local/lib/python3.7/dist-packages (from keras-tuner) (21.3)\n", "Requirement already satisfied: tensorboard in /usr/local/lib/python3.7/dist-packages (from keras-tuner) (2.8.0)\n", "Requirement already satisfied: kt-legacy in /usr/local/lib/python3.7/dist-packages (from keras-tuner) (1.0.4)\n", "Requirement already satisfied: pexpect in /usr/local/lib/python3.7/dist-packages (from ipython->keras-tuner) (4.8.0)\n", "Requirement already satisfied: prompt-toolkit<2.0.0,>=1.0.4 in /usr/local/lib/python3.7/dist-packages (from ipython->keras-tuner) (1.0.18)\n", "Requirement already satisfied: pygments in /usr/local/lib/python3.7/dist-packages (from ipython->keras-tuner) (2.6.1)\n", "Requirement already satisfied: pickleshare in /usr/local/lib/python3.7/dist-packages (from ipython->keras-tuner) (0.7.5)\n", "Requirement already satisfied: simplegeneric>0.8 in /usr/local/lib/python3.7/dist-packages (from ipython->keras-tuner) (0.8.1)\n", "Requirement already satisfied: traitlets>=4.2 in /usr/local/lib/python3.7/dist-packages (from ipython->keras-tuner) (5.1.1)\n", "Requirement already satisfied: decorator in /usr/local/lib/python3.7/dist-packages (from ipython->keras-tuner) (4.4.2)\n", "Requirement already satisfied: setuptools>=18.5 in /usr/local/lib/python3.7/dist-packages (from ipython->keras-tuner) (57.4.0)\n", "Requirement already satisfied: wcwidth in /usr/local/lib/python3.7/dist-packages (from prompt-toolkit<2.0.0,>=1.0.4->ipython->keras-tuner) (0.2.5)\n", "Requirement already satisfied: six>=1.9.0 in /usr/local/lib/python3.7/dist-packages (from prompt-toolkit<2.0.0,>=1.0.4->ipython->keras-tuner) (1.15.0)\n", "Requirement already satisfied: pyparsing!=3.0.5,>=2.0.2 in /usr/local/lib/python3.7/dist-packages (from packaging->keras-tuner) (3.0.9)\n", "Requirement already satisfied: ptyprocess>=0.5 in /usr/local/lib/python3.7/dist-packages (from pexpect->ipython->keras-tuner) (0.7.0)\n", "Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in /usr/local/lib/python3.7/dist-packages (from requests->keras-tuner) (1.24.3)\n", "Requirement already satisfied: chardet<4,>=3.0.2 in /usr/local/lib/python3.7/dist-packages (from requests->keras-tuner) (3.0.4)\n", "Requirement already satisfied: idna<3,>=2.5 in /usr/local/lib/python3.7/dist-packages (from requests->keras-tuner) (2.10)\n", "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.7/dist-packages (from requests->keras-tuner) (2022.6.15)\n", "Requirement already satisfied: absl-py>=0.4 in /usr/local/lib/python3.7/dist-packages (from tensorboard->keras-tuner) (1.1.0)\n", "Requirement already satisfied: google-auth<3,>=1.6.3 in /usr/local/lib/python3.7/dist-packages (from tensorboard->keras-tuner) (1.35.0)\n", "Requirement already satisfied: werkzeug>=0.11.15 in /usr/local/lib/python3.7/dist-packages (from tensorboard->keras-tuner) (1.0.1)\n", "Requirement already satisfied: tensorboard-data-server<0.7.0,>=0.6.0 in /usr/local/lib/python3.7/dist-packages (from tensorboard->keras-tuner) (0.6.1)\n", "Requirement already satisfied: wheel>=0.26 in /usr/local/lib/python3.7/dist-packages (from tensorboard->keras-tuner) (0.37.1)\n", "Requirement already satisfied: markdown>=2.6.8 in /usr/local/lib/python3.7/dist-packages (from tensorboard->keras-tuner) (3.3.7)\n", "Requirement already satisfied: google-auth-oauthlib<0.5,>=0.4.1 in /usr/local/lib/python3.7/dist-packages (from tensorboard->keras-tuner) (0.4.6)\n", "Requirement already satisfied: grpcio>=1.24.3 in /usr/local/lib/python3.7/dist-packages (from tensorboard->keras-tuner) (1.46.3)\n", "Requirement already satisfied: tensorboard-plugin-wit>=1.6.0 in /usr/local/lib/python3.7/dist-packages (from tensorboard->keras-tuner) (1.8.1)\n", "Requirement already satisfied: protobuf>=3.6.0 in /usr/local/lib/python3.7/dist-packages (from tensorboard->keras-tuner) (3.17.3)\n", "Requirement already satisfied: rsa<5,>=3.1.4 in /usr/local/lib/python3.7/dist-packages (from google-auth<3,>=1.6.3->tensorboard->keras-tuner) (4.8)\n", "Requirement already satisfied: pyasn1-modules>=0.2.1 in /usr/local/lib/python3.7/dist-packages (from google-auth<3,>=1.6.3->tensorboard->keras-tuner) (0.2.8)\n", "Requirement already satisfied: cachetools<5.0,>=2.0.0 in /usr/local/lib/python3.7/dist-packages (from google-auth<3,>=1.6.3->tensorboard->keras-tuner) (4.2.4)\n", "Requirement already satisfied: requests-oauthlib>=0.7.0 in /usr/local/lib/python3.7/dist-packages (from google-auth-oauthlib<0.5,>=0.4.1->tensorboard->keras-tuner) (1.3.1)\n", "Requirement already satisfied: importlib-metadata>=4.4 in /usr/local/lib/python3.7/dist-packages (from markdown>=2.6.8->tensorboard->keras-tuner) (4.11.4)\n", "Requirement already satisfied: typing-extensions>=3.6.4 in /usr/local/lib/python3.7/dist-packages (from importlib-metadata>=4.4->markdown>=2.6.8->tensorboard->keras-tuner) (4.1.1)\n", "Requirement already satisfied: zipp>=0.5 in /usr/local/lib/python3.7/dist-packages (from importlib-metadata>=4.4->markdown>=2.6.8->tensorboard->keras-tuner) (3.8.0)\n", "Requirement already satisfied: pyasn1<0.5.0,>=0.4.6 in /usr/local/lib/python3.7/dist-packages (from pyasn1-modules>=0.2.1->google-auth<3,>=1.6.3->tensorboard->keras-tuner) (0.4.8)\n", "Requirement already satisfied: oauthlib>=3.0.0 in /usr/local/lib/python3.7/dist-packages (from requests-oauthlib>=0.7.0->google-auth-oauthlib<0.5,>=0.4.1->tensorboard->keras-tuner) (3.2.0)\n" ] } ] }, { "cell_type": "code", "source": [ "import keras_tuner as kt" ], "metadata": { "id": "FrSo7VXcxfvR" }, "execution_count": 7, "outputs": [] }, { "cell_type": "code", "source": [ "max_words = 5000\n", "max_len = 350\n", "tok = Tokenizer(num_words=max_words)\n", "tok.fit_on_texts(seqs)\n", "sequences = tok.texts_to_sequences(seqs)\n", "sequences_matrix = sequence.pad_sequences(sequences,maxlen=max_len)" ], "metadata": { "id": "chro7Rdnyr7T" }, "execution_count": 8, "outputs": [] }, { "cell_type": "code", "source": [ "#Independent Testing\n", "max_words = 5000\n", "max_len = 350\n", "indtok = Tokenizer(num_words=max_words)\n", "indtok.fit_on_texts(Indseqs)\n", "Indsequences = indtok.texts_to_sequences(Indseqs)\n", "Indsequences_matrix = sequence.pad_sequences(Indsequences,maxlen=max_len)\n", "X_train=sequences_matrix\n", "y_train=y\n", "X_test=Indsequences_matrix\n", "y_test=z" ], "metadata": { "id": "bgBHgrB-NWKW" }, "execution_count": 9, "outputs": [] }, { "cell_type": "code", "source": [ "import keras_tuner as kt\n", "from tensorflow import keras" ], "metadata": { "id": "8AUGdzyDirTJ" }, "execution_count": 10, "outputs": [] }, { "cell_type": "code", "source": [ "def build_model(hp):\n", " model = keras.Sequential()\n", " model.add(keras.layers.Dense(hp.Choice('units', [2, 4, 8, 16, 32, 64, 128]),activation='relu'))\n", " model.add(keras.layers.Dense(1, activation='sigmoid'))\n", " model.compile(loss='binary_crossentropy',metrics=['accuracy']) \n", " return model" ], "metadata": { "id": "gRK1QxEkjhN-" }, "execution_count": 11, "outputs": [] }, { "cell_type": "code", "source": [ "tuner1 = kt.RandomSearch(\n", " build_model,\n", " overwrite=True,\n", " objective='val_accuracy',\n", " max_trials=10)" ], "metadata": { "id": "_EeqLMhBjhQi" }, "execution_count": 12, "outputs": [] }, { "cell_type": "code", "source": [ "tuner1.search(X_train, y_train, epochs=20, validation_data=(X_test, y_test))\n", "best_model = tuner1.get_best_models()[0]" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "xkZgo6uDjhdK", "outputId": "a37a48ee-bbd7-4513-a3cf-c1cec5001c24" }, "execution_count": 13, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Trial 5 Complete [00h 00m 08s]\n", "val_accuracy: 0.9389534592628479\n", "\n", "Best val_accuracy So Far: 0.9912790656089783\n", "Total elapsed time: 00h 00m 34s\n", "INFO:tensorflow:Oracle triggered exit\n" ] } ] }, { "cell_type": "code", "source": [ "tuner1.results_summary()" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "ZuENDraMC3sh", "outputId": "8668997d-a660-46cf-b4ef-d2779ce3b720" }, "execution_count": 14, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Results summary\n", "Results in ./untitled_project\n", "Showing 10 best trials\n", "\n", "Trial summary\n", "Hyperparameters:\n", "units: 32\n", "Score: 0.9912790656089783\n", "Trial summary\n", "Hyperparameters:\n", "units: 64\n", "Score: 0.9883720874786377\n", "Trial summary\n", "Hyperparameters:\n", "units: 8\n", "Score: 0.9767441749572754\n", "Trial summary\n", "Hyperparameters:\n", "units: 128\n", "Score: 0.9389534592628479\n", "Trial summary\n", "Hyperparameters:\n", "units: 2\n", "Score: 0.5\n" ] } ] }, { "cell_type": "code", "source": [ "best_model.build(X_train.shape)\n", "best_model.summary()" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "G2R_hisVCCGl", "outputId": "49fdd81c-899e-45cb-e578-67576e2baeda" }, "execution_count": 15, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Model: \"sequential\"\n", "_________________________________________________________________\n", " Layer (type) Output Shape Param # \n", "=================================================================\n", " dense (Dense) (1378, 32) 11232 \n", " \n", " dense_1 (Dense) (1378, 1) 33 \n", " \n", "=================================================================\n", "Total params: 11,265\n", "Trainable params: 11,265\n", "Non-trainable params: 0\n", "_________________________________________________________________\n" ] } ] }, { "cell_type": "code", "source": [ "accr = best_model.evaluate(X_test,y_test)\n", "print('Test set\\n Loss: {:0.3f}\\n Accuracy: {:0.3f}'.format(accr[0],accr[1]))" ], "metadata": { "id": "mu_n3V0Xjhft", "colab": { "base_uri": "https://localhost:8080/" }, "outputId": "96cff5ee-f9db-4801-da50-4a8051acd8bd" }, "execution_count": 16, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "11/11 [==============================] - 0s 2ms/step - loss: 0.3481 - accuracy: 0.9913\n", "Test set\n", " Loss: 0.348\n", " Accuracy: 0.991\n" ] } ] }, { "cell_type": "code", "source": [ "pred=best_model.predict(X_test)\n", "pred1 = np.round_(pred)\n", "\n", "from sklearn.metrics import matthews_corrcoef as mcc\n", "mc=mcc(y_test, pred1)\n", "print(\"MCC: \",mc)\n", "from sklearn.metrics import confusion_matrix as cm\n", "cm(y_test, pred1)" ], "metadata": { "id": "KIAmIGewjhi_", "colab": { "base_uri": "https://localhost:8080/" }, "outputId": "301ecf3a-e47d-4830-8780-ef29ac9cb360" }, "execution_count": 17, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "MCC: 0.9827076298239907\n" ] }, { "output_type": "execute_result", "data": { "text/plain": [ "array([[172, 0],\n", " [ 3, 169]])" ] }, "metadata": {}, "execution_count": 17 } ] }, { "cell_type": "code", "source": [ "from sklearn.metrics import matthews_corrcoef as mcc\n", "mc=mcc(y_test, pred1)\n", "print(\"MCC: \",mc)\n", "from sklearn.metrics import confusion_matrix as cm\n", "cm(y_test, pred1)\n", "print(classification_report(y_test, pred1))\n", "tp, fn, fp, tn = confusion_matrix(y_test, pred1).ravel()\n", "print(\"MCC ---> {0}\".format(mc))\n", "print(\"Confusion Matrix. tn, fp, fn, tp ---> \", tp, fn, fp, tn)\n", "print(\"Precision --->TP/TP+Fp \", tp/(tp+fp))\n", "print(\"Recall - SN - Sensitivity --->TP/TP+FN \", tp/(tp+fn))\n", "print(\"Specificity - SP ---> \", tn/(tn+fp))\n", "print(\"Balanced Accuracy ---> \", ((tp/(tp+fn))+(tn/(tn+fp)))/2)\n", "print(\"Jaccard Index --->TP/TP+FN+FP \", tp/(tp+fn+fp))" ], "metadata": { "id": "RG-JsifKTmxp", "colab": { "base_uri": "https://localhost:8080/" }, "outputId": "5a8cbe62-a934-4e36-f333-552a8e339c9d" }, "execution_count": 18, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "MCC: 0.9827076298239907\n", " precision recall f1-score support\n", "\n", " 0 0.98 1.00 0.99 172\n", " 1 1.00 0.98 0.99 172\n", "\n", " accuracy 0.99 344\n", " macro avg 0.99 0.99 0.99 344\n", "weighted avg 0.99 0.99 0.99 344\n", "\n", "MCC ---> 0.9827076298239907\n", "Confusion Matrix. tn, fp, fn, tp ---> 172 0 3 169\n", "Precision --->TP/TP+Fp 0.9828571428571429\n", "Recall - SN - Sensitivity --->TP/TP+FN 1.0\n", "Specificity - SP ---> 0.9825581395348837\n", "Balanced Accuracy ---> 0.9912790697674418\n", "Jaccard Index --->TP/TP+FN+FP 0.9828571428571429\n" ] } ] }, { "cell_type": "code", "source": [ "from sklearn import metrics\n", "import matplotlib.pyplot as plt\n", "from sklearn.metrics import RocCurveDisplay\n", "fpr, tpr, _ = metrics.roc_curve(y_test, pred1)\n", "auc = metrics.roc_auc_score(y_test, pred1)\n", "\n", "#create ROC curve\n", "plt.plot(fpr,tpr)\n", "plt.plot(fpr,tpr,label=\"AUC=\"+str(auc))\n", "plt.ylabel('True Positive Rate')\n", "plt.xlabel('False Positive Rate')\n", "plt.legend(loc=4)\n", "plt.show()" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 279 }, "id": "icVoSPCr3dxD", "outputId": "9021008e-5713-4bc6-f170-c3816f122eef" }, "execution_count": 19, "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ "
" ], "image/png": "iVBORw0KGgoAAAANSUhEUgAAAYIAAAEGCAYAAABo25JHAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADh0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uMy4yLjIsIGh0dHA6Ly9tYXRwbG90bGliLm9yZy+WH4yJAAAgAElEQVR4nO3dfZgU1Zn38e/dMyCKIgbQjYwDiEMcB2HE0ZFIQMQQfMOsIogxYtYsxkiM4rqQ4KNGd5ONbmI0IUZBo2YjiK4vJAK6CkRNYgSjiEBAFJAhMQIiBlGc6b6fP6q66XnvAarHmfp9rquvrjp1uuqu7plz16nTXWXujoiIxFeitQMQEZHWpUQgIhJzSgQiIjGnRCAiEnNKBCIiMVfY2gG0VPfu3b13796tHYaISJvy8ssvb3H3Hg0ta3OJoHfv3ixdurS1wxARaVPMbENjy3RqSEQk5pQIRERiTolARCTmlAhERGJOiUBEJOYiSwRmdq+ZvWtmrzey3MzsDjNba2avmdmgqGIREZHGRdkjuA8Y1cTy04GS8DERuDPCWEREpBGR/Y7A3Z8zs95NVDkHeMCD62C/aGZdzeyz7v63qGISEQHwVIpUKkUyWUMqWUMqlSSZTJJKJkkla0gma/BUMlyexFPpeh5OB/U8lfWcSuJhXfdUMO01eDJFKpWEVFAv+2Geykzj4XNmOoWlkrgnwYPpzww6h36Dhu3z96M1f1DWE9iYNV8VltVLBGY2kaDXQHFxcV6CE2lNdRuqZLKGZDKJh9Op1O5GK5VK7W6oksnMskyDlaqBZJJUunFKZTVcqWCdeJJUMoV7DaSyGqesRqqhaXMPGqqscjyJpcLGK2zEMtNh45cuN989b6TC6ez5JImwLEEyfE7tfiZFIlyWCMvqPTxFQdZ8ASkKzCkAClr7g26hP3X5LLSzRJAzd78buBugoqJCd9L5FPCwkUofMdVtqDxseDKNU7KGVCosT+1usNINEukGLBUcQXm9o6caPOVBQ5UMy7Ibp+xGylN1Gq1Ug41U7YaqduOV3UDhXqthSpcnPFW7scpqoIL5ZGY6kdVgGV6rUUovL8gua4MNVcoze5x5Tlkw7UGTvXsPbffyFAk8LHOMlBUE75AlcCsgZYWkEsG0h2WO4VYAVqc8XZYoACsAbPd0dnnmOQFWgFkiKAvLLZzOPGfKElhYbonCrOlwviBBIlGIhfUSBUGdRKKAREFBsCx8DpYZiYJCCsLygoJCrKCQgnA6kX4OX18Z0WfXmolgE3BE1nxRWBaZHR9so+aTXZmGKpk5ikplGifPPGc1VJku4O6jqUy3L+VZDVWdRimrISPsAmYapKyGLN3ty+4C1m6cah89kWmMGj+ySmTXyTRMYXmtxim5+1/UPftfePe/bZ2GKoGTMKeQNnIkEUpmNVSpOg1VveNI291gOZZpqFIk8HCZW1gv0ZGasHx3Q1W7gcpusGo1SNnL6zZSltjdUDXQSJHdOKWnCwowKyRREL4uqyEK5oOGKhHWDRqkoBELGqoCLJHINFSJgoLdz4n6DZUlEhQUFIaNVUJfQ2yjWvP/eC4wycxmA5XA9ijHB15+cibHL7kmqtXvEzWe6ezuPqoKG51knUYqOMJKN1Tp8rBxChuh4NlIWbqhSjde6QYo6ygqPMLy8Mgou/FKNzpBmWUdTQVHSh42HpmyRNiI1Tmyyn6QbozSR061jqp2z6ePqCxzRFWQaZzSjVdBWCc4gko3Trvn041UQSLRpo6wRfIlskRgZrOAU4DuZlYF3AB0AHD3XwDzgDOAtcBO4GtRxQJQ/d7bALx41FVYh/0zjVS9LmAi3U0MGiorSGAWNE7phipRsLteputXUPfIKjgqS3f7CI+cEpnuXkGmkUp3AdvS0bWItB9RfmtofDPLHbgiqu03ZsCXJ3PAgQfne7MiIp9aOqUnIhJzSgQiIjGnRCAiEnNKBCIiMadEICISc0oEIiIxp0QgIhJzSgQiIjGnRCAiEnNKBCIiMadEICISc0oEIiIxp0QgIhJzSgQiIjGnRCAiEnNKBCIiMadEICISc0oEIiIxp0QgIhJzSgQiIjGnRCAiEnNKBCIiMadEICISc0oEIiIxp0QgIhJzSgQiIjGnRCAiEnNKBCIiMadEICISc0oEIiIxp0QgIhJzkSYCMxtlZqvNbK2ZTW1gebGZLTKzV8zsNTM7I8p4RESkvsgSgZkVANOB04FjgPFmdkydatcBc9z9OOAC4OdRxSMiIg2LskdwIrDW3d9y90+A2cA5deo40CWcPhj4a4TxiIhIA6JMBD2BjVnzVWFZthuBi8ysCpgHfKuhFZnZRDNbamZLN2/eHEWsIiKx1dqDxeOB+9y9CDgD+JWZ1YvJ3e929wp3r+jRo0fegxQRac+iTASbgCOy5ovCsmyXAnMA3P2PQCege4QxiYhIHVEmgiVAiZn1MbOOBIPBc+vUeRsYAWBmpQSJQOd+RETyKLJE4O41wCTgKWAVwbeDVpjZTWY2Oqx2DfCvZrYMmAVc4u4eVUwiIlJfYZQrd/d5BIPA2WXXZ02vBE6OMgYREWlaaw8Wi4hIK1MiEBGJOSUCEZGYUyIQEYk5JQIRkZhTIhARiTklAhGRmFMiEBGJOSUCEZGYUyIQEYm5nBOBmR0QZSAiItI6mk0EZvZ5M1sJ/CWcH2hmuqWkiEg7kUuP4DbgS8BWAHdfBgyNMigREcmfnE4NufvGOkXJCGIREZFWkMtlqDea2ecBN7MOwLcJ7i8gIiLtQC49gm8AVxDceH4TUA58M8qgREQkf3LpEXzO3b+SXWBmJwO/jyYkERHJp1x6BD/NsUxERNqgRnsEZjYY+DzQw8wmZy3qAhREHZiIiORHU6eGOgIHhnUOyir/ABgTZVAiIpI/jSYCd/8d8Dszu8/dN+QxJhERyaNcBot3mtmtQBnQKV3o7qdGFpWIiORNLoPFvya4vEQf4HvAemBJhDGJiEge5ZIIurn7PUC1u//O3f8FUG9ARKSdyOXUUHX4/DczOxP4K/CZ6EISEZF8yiUR/IeZHQxcQ/D7gS7AVZFGJSIiedNsInD334aT24HhkPllsYiItANN/aCsABhLcI2hBe7+upmdBXwX2B84Lj8hiohIlJrqEdwDHAG8BNxhZn8FKoCp7v54PoITEZHoNZUIKoAB7p4ys07AO0Bfd9+an9BERCQfmvr66CfungJw94+Bt1qaBMxslJmtNrO1Zja1kTpjzWylma0wswdbsn4REdl7TfUIjjaz18JpA/qG8wa4uw9oasXhGMN04ItAFbDEzOa6+8qsOiXAd4CT3X2bmR26F/siIiJ7oKlEULqX6z4RWOvubwGY2WzgHGBlVp1/Baa7+zYAd393L7cpIiIt1NRF5/b2QnM9gex7HVcBlXXq9AMws98TXNr6RndfUHdFZjYRmAhQXFy8l2GJiEi2nG5eH6FCoAQ4BRgPzDCzrnUrufvd7l7h7hU9evTIc4giIu1blIlgE8HXT9OKwrJsVcBcd69293XAGoLEICIieZJTIjCz/c3scy1c9xKgxMz6mFlH4AJgbp06jxP0BjCz7gSnit5q4XZERGQvNJsIzOxs4FVgQThfbmZ1G/R63L0GmAQ8BawC5rj7CjO7ycxGh9WeAraa2UpgEXCtfqcgIpJfuVx07kaCbwAtBnD3V82sTy4rd/d5wLw6ZddnTTswOXyIiEgryOXUULW7b69T5lEEIyIi+ZdLj2CFmV0IFIQ/ALsS+EO0YYmISL7k0iP4FsH9incBDxJcjlr3IxARaSdy6REc7e7TgGlRByMiIvmXS4/gR2a2ysxuNrP+kUckIiJ51WwicPfhBHcm2wzcZWbLzey6yCMTEZG8yOkHZe7+jrvfAXyD4DcF1zfzEhERaSNy+UFZqZndaGbLCW5e/weCy0WIiEg7kMtg8b3AQ8CX3P2vEccjIiJ51mwicPfB+QhERERaR6OJwMzmuPvY8JRQ9i+Jc7pDmYiItA1N9Qi+HT6flY9ARESkdTQ6WOzufwsnv+nuG7IfwDfzE56IiEQtl6+PfrGBstP3dSAiItI6mhojuJzgyP9IM3sta9FBwO+jDkxERPKjqTGCB4H5wA+AqVnl/3D39yKNSkRE8qapRODuvt7Mrqi7wMw+o2QgItI+NNcjOAt4meDro5a1zIEjI4xLRETypNFE4O5nhc853ZZSRETaplyuNXSymXUOpy8ysx+bWXH0oYmISD7k8vXRO4GdZjYQuAZ4E/hVpFGJiEje5JIIatzdgXOAn7n7dIKvkIqISDuQy9VH/2Fm3wG+CnzBzBJAh2jDEhGRfMmlRzCO4Mb1/+Lu7xDci+DWSKMSEZG8yeVWle8AvwYONrOzgI/d/YHIIxMRkbzI5VtDY4GXgPOBscCfzGxM1IGJiEh+5DJGMA04wd3fBTCzHsAzwCNRBiYiIvmRyxhBIp0EQltzfJ2IiLQBufQIFpjZU8CscH4cMC+6kEREJJ9yuWfxtWZ2LjAkLLrb3R+LNiwREcmXpu5HUAL8N9AXWA78m7tvyldgIiKSH02d678X+C1wHsEVSH/a0pWb2SgzW21ma81sahP1zjMzN7OKlm5DRET2TlOnhg5y9xnh9Goz+3NLVmxmBcB0gltdVgFLzGyuu6+sU+8g4NvAn1qyfhER2TeaSgSdzOw4dt+HYP/seXdvLjGcCKx197cAzGw2wfWKVtapdzPwQ+DaFsYuIiL7QFOJ4G/Aj7Pm38mad+DUZtbdE9iYNV8FVGZXMLNBwBHu/qSZNZoIzGwiMBGguFhXwBYR2ZeaujHN8Cg3HF687sfAJc3Vdfe7gbsBKioqPMq4RETiJsofhm0CjsiaLwrL0g4C+gOLzWw9cBIwVwPGIiL5FWUiWAKUmFkfM+sIXADMTS909+3u3t3de7t7b+BFYLS7L40wJhERqSOyRODuNcAk4ClgFTDH3VeY2U1mNjqq7YqISMs0+8tiMzPgK8CR7n5TeL/if3L3l5p7rbvPo87lKNz9+kbqnpJTxCIisk/l0iP4OTAYGB/O/4Pg9wEiItIO5HLRuUp3H2RmrwC4+7bwnL+IiLQDufQIqsNfCTtk7keQijQqERHJm1wSwR3AY8ChZvafwAvA9yONSkRE8iaXy1D/2sxeBkYQXF7iy+6+KvLIREQkL3L51lAxsBP4TXaZu78dZWAiIpIfuQwWP0kwPmBAJ6APsBooizAuERHJk1xODR2bPR9eKO6bkUUkIiJ51eJfFoeXn65stqKIiLQJuYwRTM6aTQCDgL9GFpGIiORVLmMEB2VN1xCMGfxvNOGIiEi+NZkIwh+SHeTu/5aneEREJM8aHSMws0J3TwIn5zEeERHJs6Z6BC8RjAe8amZzgYeBD9ML3f3RiGMTEZE8yGWMoBOwleAexenfEzigRCAi0g40lQgODb8x9Dq7E0Ca7hssItJONJUICoADqZ0A0pQIRETaiaYSwd/c/aa8RSIiIq2iqV8WN9QTEBGRdqapRDAib1GIiEiraTQRuPt7+QxERERaR4svOiciIu2LEoGISMwpEYiIxJwSgYhIzCkRiIjEnBKBiEjMKRGIiMScEoGISMwpEYiIxFykicDMRpnZajNba2ZTG1g+2cxWmtlrZvasmfWKMh4REakvskQQ3u94OnA6cAww3syOqVPtFaDC3QcAjwC3RBWPiIg0LMoewYnAWnd/y90/AWYD52RXcPdF7r4znH0RKIowHhERaUCUiaAnsDFrviosa8ylwPyGFpjZRDNbamZLN2/evA9DFBGRT8VgsZldBFQAtza03N3vdvcKd6/o0aNHfoMTEWnncrl5/Z7aBByRNV8UltViZqcB04Bh7r4rwnhERKQBUfYIlgAlZtbHzDoCFwBzsyuY2XHAXcBod383wlhERKQRkSUCd68BJgFPAauAOe6+wsxuMrPRYbVbgQOBh83sVTOb28jqREQkIlGeGsLd5wHz6pRdnzV9WpTbFxGR5n0qBotFRKT1KBGIiMScEoGISMwpEYiIxJwSgYhIzCkRiIjEnBKBiEjMKRGIiMScEoGISMwpEYiIxJwSgYhIzCkRiIjEnBKBiEjMKRGIiMScEoGISMwpEYiIxJwSgYhIzCkRiIjEnBKBiEjMKRGIiMScEoGISMwVtnYAIp821dXVVFVV8fHHH7d2KCIt1qlTJ4qKiujQoUPOr1EiEKmjqqqKgw46iN69e2NmrR2OSM7cna1bt1JVVUWfPn1yfp1ODYnU8fHHH9OtWzclAWlzzIxu3bq1uDerRCDSACUBaav25G9XiUBEJOaUCEQ+pR5//HHMjL/85S8ALF68mLPOOqtWnUsuuYRHHnkECAa5p06dSklJCYMGDWLw4MHMnz8/p23t2rWLcePGcdRRR1FZWcn69esbrHf77bfTv39/ysrK+MlPfpIpX7ZsGYMHD+bYY4/l7LPP5oMPPgBg69atDB8+nAMPPJBJkyZl6u/cuZMzzzyTo48+mrKyMqZOnZpZdvXVV1NeXk55eTn9+vWja9eumWVTpkyhf//+9O/fn4ceeihTvm7dOiorKznqqKMYN24cn3zySWbZnDlzOOaYYygrK+PCCy9sdl1f+MIXMts//PDD+fKXv5xZtnjxYsrLyykrK2PYsGEArF69OlO/vLycLl261HpvAH70ox9hZmzZsqVW+ZIlSygsLMx8hgCjRo2ia9eu9T7rZ599lkGDBlFeXs6QIUNYu3Ztg5/RHnH3NvU4/vjjfU/88YH/535DF//wH+/v0eslPlauXNnaIbi7+9ixY33IkCF+/fXXu7v7okWL/Mwzz6xVZ8KECf7www+7u/uUKVP84osv9o8//tjd3d955x1/6KGHctrW9OnT/bLLLnN391mzZvnYsWPr1Vm+fLmXlZX5hx9+6NXV1T5ixAh/44033N29oqLCFy9e7O7u99xzj1933XXu7r5jxw5//vnn/c477/Qrrrgis64PP/zQFy5c6O7uu3bt8iFDhvi8efPqbfOOO+7wr33ta+7u/tvf/tZPO+00r66u9h07dnhFRYVv377d3d3PP/98nzVrlru7X3bZZf7zn//c3d3XrFnj5eXl/t5777m7+9///vdm15Xt3HPP9fvvv9/d3bdt2+alpaW+YcOGWuvKVlNT44cddpivX78+U/b222/7yJEjvbi42Ddv3lyr7vDhw/3000/PfIbu7s8884zPnTu33mddUlKS+ducPn26T5gwod720xr6GwaWeiPtqr41JNKU+VPhneX7dp3/dCyc/l9NVtmxYwcvvPACixYt4uyzz+Z73/tek/V37tzJjBkzWLduHfvttx8Ahx12GGPHjs0ppCeeeIIbb7wRgDFjxjBp0iTcvdb55lWrVlFZWckBBxwAwLBhw3j00Uf593//d9asWcPQoUMB+OIXv8iXvvQlbr75Zjp37tzg0esBBxzA8OHDAejYsSODBg2iqqqqXlyzZs3K7PvKlSsZOnQohYWFFBYWMmDAABYsWMD555/PwoULefDBBwGYMGECN954I5dffjkzZszgiiuu4JBDDgHg0EMPbXJd2e/XBx98wMKFC/nlL38JwIMPPsi5555LcXFxrXVle/bZZ+nbty+9evXKlF199dXccsstnHPOObXq/vSnP+W8885jyZIltcpHjBjB4sWL663bzDI9re3bt3P44YfXq7OndGpI5FPoiSeeYNSoUfTr149u3brx8ssvN1l/7dq1FBcX06VLlwaXjxs3rtbpi/TjgQceAGDTpk0cccQRABQWFnLwwQezdevWWuvo378/zz//PFu3bmXnzp3MmzePjRs3AlBWVsYTTzwBwMMPP5wpz8X777/Pb37zG0aMGFGrfMOGDaxbt45TTz0VgIEDB7JgwQJ27tzJli1bWLRoERs3bmTr1q107dqVwsLguLaoqIhNmzYBsGbNGtasWcPJJ5/MSSedxIIFC5pcV7bHH3+cESNGZN7TNWvWsG3bNk455RSOP/74zHuXbfbs2YwfPz4z/8QTT9CzZ08GDhxYq96mTZt47LHHuPzyy3N+n2bOnMkZZ5xBUVERv/rVr2qdTttb6hGINKWZI/eozJo1i29/+9sAXHDBBcyaNYuzzz67wbq5fEsk+xz4niotLWXKlCmMHDmSzp07U15eTkFBAQD33nsvV155JTfffDOjR4+mY8eOOa2zpqaG8ePHc+WVV3LkkUfWWjZ79mzGjBmT2cbIkSNZsmQJn//85+nRoweDBw/OLGtq/W+88QaLFy+mqqqKoUOHsnz58pzWNWvWLL7+9a/XWtfLL7/Ms88+y0cffcTgwYM56aST6NevHwCffPIJc+fO5Qc/+AEQ9NK+//3v8/TTT9eL66qrruKHP/whiUTux+K33XYb8+bNo7KykltvvZXJkyczc+bMnF/flEgTgZmNAm4HCoCZ7v5fdZbvBzwAHA9sBca5+/ooYxL5tHvvvfdYuHAhy5cvx8xIJpOYGRMmTGDbtm316nbv3p2jjjqKt99+mw8++KDBXsG4ceNYvXp1vfLJkydz8cUX07NnTzZu3EhRURE1NTVs376dbt261at/6aWXcumllwLw3e9+l6KiIgCOPvroTIO3Zs0annzyyZz2deLEiZSUlHDVVVfVWzZ79mymT59eq2zatGlMmzYNgAsvvDDTY3r//fepqamhsLCQqqoqevbsCQS9g8rKSjp06ECfPn3o168fb7zxBieccEKD60rbsmULL730Eo899limrKioiG7dutG5c2c6d+7M0KFDWbZsWeZ18+fPZ9CgQRx22GEAvPnmm6xbty7TG6iqqmLQoEG89NJLLF26lAsuuCCzrXnz5lFYWFhrYDrb5s2bWbZsGZWVlUDweY4aNSqn9zgnjQ0e7O2DoPF/EzgS6AgsA46pU+ebwC/C6QuAh5pbrwaLJWqtPVh81113+cSJE2uVDR061BcvXuy9e/fOxLd+/XovLi72998P/qavvfZav+SSS3zXrl3u7v7uu+/6nDlzctrmz372s1qDxeeff36D9dIDpBs2bPDPfe5zvm3btlrlyWTSv/rVr/o999xT63W//OUvaw0Wu7tPmzbNzz33XE8mk/W2s2rVKu/Vq5enUqlMWU1NjW/ZssXd3ZctW+ZlZWVeXV3t7u5jxoypNVg8ffp0d3efP3++X3zxxe7uvnnzZi8qKvItW7Y0uS539zvvvDPzurSVK1f6qaee6tXV1f7hhx96WVmZL1++PLN83Lhxfu+99zb4vrm79+rVq9ZgcVr2gH9a3S8GVFdXe7du3Xz16tXu7j5z5kw/99xzG91WSweLo0wEg4Gnsua/A3ynTp2ngMHhdCGwBbCm1qtEIFFr7URwyimn+Pz582uV3X777f6Nb3zDX3jhBa+srPSBAwd6RUWFP/3005k6u3bt8muvvdb79u3rZWVlfuKJJ/qCBQty2uZHH33kY8aM8b59+/oJJ5zgb775pru7b9q0yU8//fRMvSFDhnhpaakPGDDAn3nmmUz5T37yEy8pKfGSkhKfMmVKrQa8V69efsghh3jnzp29Z8+evmLFCt+4caMDfvTRR/vAgQN94MCBPmPGjMxrbrjhBp8yZUq9GEtLS720tNQrKyv9lVdeySx78803/YQTTvC+ffv6mDFjMt+cSqVSfvXVV3tpaan3798/kyyaWpe7+7Bhw+p9Bu7ut9xyi5eWlnpZWZnfdtttmfIdO3b4Zz7zmUxSbkiuiWDIkCHevXt379Spk/fs2TPzGT766KPev39/HzBggA8bNizzGTWkpYnAguX7npmNAUa5+9fD+a8Cle4+KavO62GdqnD+zbDOljrrmghMBCguLj5+w4YNLY7nlaf/B3/tIY65Yjad9u+8p7slMbBq1SpKS0tbOwyRPdbQ37CZvezuFQ3VbxODxe5+N3A3QEVFxR5lruNGXgQjL9qncYmItAdRfn10E3BE1nxRWNZgHTMrBA4mGDQWEZE8iTIRLAFKzKyPmXUkGAyeW6fOXGBCOD0GWOhRnasSaQH9GUpbtSd/u5ElAnevASYRDAivAua4+wozu8nMRofV7gG6mdlaYDKw734hIbKHOnXqxNatW5UMpM1xD+5H0KlTpxa9LrLB4qhUVFT40qVLWzsMacd0hzJpyxq7Q1mbHywWyaf0j49E4kLXGhIRiTklAhGRmFMiEBGJuTY3WGxmm4GW/7Q40J3gMhZxon2OB+1zPOzNPvdy9x4NLWhziWBvmNnSxkbN2yvtczxon+Mhqn3WqSERkZhTIhARibm4JYK7WzuAVqB9jgftczxEss+xGiMQEZH64tYjEBGROpQIRERirl0mAjMbZWarzWytmdW7oqmZ7WdmD4XL/2RmvfMf5b6Vwz5PNrOVZvaamT1rZr1aI859qbl9zqp3npm5mbX5rxrmss9mNjb8rFeY2YP5jnFfy+Fvu9jMFpnZK+Hf9xmtEee+Ymb3mtm74R0cG1puZnZH+H68ZmaD9nqjjd3Dsq0+gALgTeBIoCOwDDimTp1vAr8Ipy8AHmrtuPOwz8OBA8Lpy+Owz2G9g4DngBeBitaOOw+fcwnwCnBIOH9oa8edh32+G7g8nD4GWN/ace/lPg8FBgGvN7L8DGA+YMBJwJ/2dpvtsUdwIrDW3d9y90+A2cA5deqcA9wfTj8CjDAzy2OM+1qz++zui9x9Zzj7IsEd49qyXD5ngJuBHwLt4ZrSuezzvwLT3X0bgLu/m+cY97Vc9tmBLuH0wcBf8xjfPufuzwHvNVHlHOABD7wIdDWzz+7NNttjIugJbMyarwrLGqzjwQ10tgPd8hJdNHLZ52yXEhxRtGXN7nPYZT7C3Z/MZ2ARyuVz7gf0M7Pfm9mLZjYqb9FFI5d9vhG4yMyqgHnAt/ITWqtp6f97s3Q/gpgxs4uACmBYa8cSJTNLAD8GLmnlUPKtkOD00CkEvb7nzOxYd3+/VaOK1njgPnf/kZkNBn5lZv3dPdXagbUV7bFHsAk4Imu+KCxrsI6ZFRJ0J7fmJbpo5LLPmNlpwDRgtLvvylNsUWlunw8C+gOLzWw9wbnUuW18wDiXz7kKmOvu1e6+DlhDkBjaqlz2+VJgDoC7/xHoRHBxtvYqp//3lmiPiWAJUGJmfcysIxmsNEoAAAUaSURBVMFg8Nw6deYCE8LpMcBCD0dh2qhm99nMjgPuIkgCbf28MTSzz+6+3d27u3tvd+9NMC4y2t3b8n1Oc/nbfpygN4CZdSc4VfRWPoPcx3LZ57eBEQBmVkqQCDbnNcr8mgtcHH576CRgu7v/bW9W2O5ODbl7jZlNAp4i+MbBve6+wsxuApa6+1zgHoLu41qCQZkLWi/ivZfjPt8KHAg8HI6Lv+3uo1st6L2U4z63Kznu81PASDNbCSSBa929zfZ2c9zna4AZZnY1wcDxJW35wM7MZhEk8+7huMcNQAcAd/8FwTjIGcBaYCfwtb3eZht+v0REZB9oj6eGRESkBZQIRERiTolARCTmlAhERGJOiUBEJOaUCORTycySZvZq1qN3E3V37IPt3Wdm68Jt/Tn8hWpL1zHTzI4Jp79bZ9kf9jbGcD3p9+V1M/uNmXVtpn55W78ap0RPXx+VTyUz2+HuB+7ruk2s4z7gt+7+iJmNBP7b3Qfsxfr2Oqbm1mtm9wNr3P0/m6h/CcFVVyft61ik/VCPQNoEMzswvI/Cn81suZnVu9KomX3WzJ7LOmL+Qlg+0sz+GL72YTNrroF+DjgqfO3kcF2vm9lVYVlnM3vSzJaF5ePC8sVmVmFm/wXsH8bx63DZjvB5tpmdmRXzfWY2xswKzOxWM1sSXmP+shzelj8SXmzMzE4M9/EVM/uDmX0u/CXuTcC4MJZxYez3mtlLYd2GrtgqcdPa197WQ4+GHgS/in01fDxG8Cv4LuGy7gS/qkz3aHeEz9cA08LpAoLrDXUnaNg7h+VTgOsb2N59wJhw+nzgT8DxwHKgM8GvslcAxwHnATOyXntw+LyY8J4H6Ziy6qRj/Gfg/nC6I8FVJPcHJgLXheX7AUuBPg3EuSNr/x4GRoXzXYDCcPo04H/D6UuAn2W9/vvAReF0V4JrEXVu7c9bj9Z9tLtLTEi78ZG7l6dnzKwD8H0zGwqkCI6EDwPeyXrNEuDesO7j7v6qmQ0juFnJ78NLa3QkOJJuyK1mdh3BdWouJbh+zWPu/mEYw6PAF4AFwI/M7IcEp5Oeb8F+zQduN7P9gFHAc+7+UXg6aoCZjQnrHUxwsbh1dV6/v5m9Gu7/KuD/surfb2YlBJdZ6NDI9kcCo83s38L5TkBxuC6JKSUCaSu+AvQAjnf3aguuKNopu4K7PxcmijOB+8zsx8A24P/cfXwO27jW3R9Jz5jZiIYqufsaC+51cAbwH2b2rLvflMtOuPvHZrYY+BIwjuBGKxDcbepb7v5UM6v4yN3LzewAguvvXAHcQXADnkXu/s/hwPriRl5vwHnuvjqXeCUeNEYgbcXBwLthEhgO1LvnsgX3Yf67u88AZhLc7u9F4GQzS5/z72xm/XLc5vPAl83sADPrTHBa53kzOxzY6e7/Q3Axv4buGVsd9kwa8hDBhcLSvQsIGvXL068xs37hNhvkwd3mrgSusd2XUk9fiviSrKr/IDhFlvYU8C0Lu0cWXJVWYk6JQNqKXwMVZrYcuBj4SwN1TgGWmdkrBEfbt7v7ZoKGcZaZvUZwWujoXDbo7n8mGDt4iWDMYKa7vwIcC7wUnqK5AfiPBl5+N/BaerC4jqcJbgz0jAe3X4Qgca0E/mzBTcvvopkeexjLawQ3ZrkF+EG479mvWwQckx4sJug5dAhjWxHOS8zp66MiIjGnHoGISMwpEYiIxJwSgYhIzCkRiIjEnBKBiEjMKRGIiMScEoGISMz9f/eDjMJHYrtAAAAAAElFTkSuQmCC\n" }, "metadata": { "needs_background": "light" } } ] } ], "metadata": { "kernelspec": { "display_name": "Python 3", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.8.5" }, "colab": { "name": "KerasTuner.ipynb", "provenance": [], "collapsed_sections": [] }, "accelerator": "GPU" }, "nbformat": 4, "nbformat_minor": 0 }