CuGenDBv2

CsGy2G004980 (gene) of Cucumber (Gy14) v2.1 genome

Gene ID: CsGy2G004980
Organism: Cucumis sativus L. var. sativus cv. Gy14 (Cucumber (Gy14) v2.1)
Description: Protein of unknown function, DUF538
Genome location: Gy14Chr2:3440898..3441831
RNA-Seq Expression: CsGy2G004980
Synteny: CsGy2G004980
Gene Ontology terms: NA
InterPro domains: IPR007493 - Protein of unknown function DUF538
                  IPR036758 - At5g01610-like superfamily


Homology Show/hide homology
GenBank top hits | e value | % identity | Alignment
KAA0048082.1 plant/F25P12-18 protein [Cucumis melo var. makuwa] | 1.22e-115 | 94.12 | Show/hide
Query:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK
        MSLITE+IKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK
Subjt:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK

Query:  ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKEKENKEKEVVNGAVAAAAIEVKEV
        ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEE+VKVV EKENKE+ENKEKE     NKEK+VVNGA AAAAIEVKEV
Subjt:  ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKEKENKEKEVVNGAVAAAAIEVKEV

TYJ96455.1 plant/F25P12-18 protein [Cucumis melo var. makuwa] | 1.58e-119 | 96.26 | Show/hide
Query:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK
        MSLITE+IKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK
Subjt:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK

Query:  ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKEKENKEKEVVNGAVAAAAIEVKEV
        ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEE+VKVV EKENKE+ENKEKE KEKENKEK+VVNGA AAAAIEVKEV
Subjt:  ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKEKENKEKEVVNGAVAAAAIEVKEV

XP_008453262.1 PREDICTED: uncharacterized protein LOC103494033 [Cucumis melo] | 1.14e-112 | 91.98 | Show/hide
Query:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK
        MSLITE+IKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK
Subjt:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK

Query:  ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKEKENKEKEVVNGAVAAAAIEVKEV
        ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEE+VKVV EKENKE          KENKEK+VVNGA AAAAIEVKEV
Subjt:  ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKEKENKEKEVVNGAVAAAAIEVKEV

XP_011648877.1 uncharacterized protein LOC105434559 [Cucumis sativus] | 4.21e-124 | 100 | Show/hide
Query:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK
        MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK
Subjt:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK

Query:  ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKEKENKEKEVVNGAVAAAAIEVKEV
        ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKEKENKEKEVVNGAVAAAAIEVKEV
Subjt:  ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKEKENKEKEVVNGAVAAAAIEVKEV

XP_038889922.1 uncharacterized protein LOC120079689 [Benincasa hispida] | 4.88e-101 | 83.96 | Show/hide
Query:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK
        MSLITE+IKAKADELYYGDEMC+IKSRELLKEMDLPNGLLPMKDMEECG+VKETGFVWLKQKKSYTHKF+DIDRLVTYGTEVTAYVEKNKVKKLTGVKAK
Subjt:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK

Query:  ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKEKENKEKEVVNGAVAAAAIEVKEV
        EL++WLPLCDIYVN+PPNGKITFKSTTGLSRTFPVSAFQVEE+VK  EEK+NKE               KEVV  A  AAAIEVKEV
Subjt:  ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKEKENKEKEVVNGAVAAAAIEVKEV

TrEMBL top hits | e value | % identity | Alignment
A0A0A0LH04 Uncharacterized protein | 2.04e-124 | 100 | Show/hide
Query:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK
        MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK
Subjt:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK

Query:  ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKEKENKEKEVVNGAVAAAAIEVKEV
        ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKEKENKEKEVVNGAVAAAAIEVKEV
Subjt:  ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKEKENKEKEVVNGAVAAAAIEVKEV

A0A1S3BV88 uncharacterized protein LOC103494033 | 5.53e-113 | 91.98 | Show/hide
Query:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK
        MSLITE+IKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK
Subjt:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK

Query:  ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKEKENKEKEVVNGAVAAAAIEVKEV
        ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEE+VKVV EKENKE          KENKEK+VVNGA AAAAIEVKEV
Subjt:  ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKEKENKEKEVVNGAVAAAAIEVKEV

A0A5A7TX45 Plant/F25P12-18 protein | 5.89e-116 | 94.12 | Show/hide
Query:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK
        MSLITE+IKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK
Subjt:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK

Query:  ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKEKENKEKEVVNGAVAAAAIEVKEV
        ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEE+VKVV EKENKE+ENKEKE     NKEK+VVNGA AAAAIEVKEV
Subjt:  ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKEKENKEKEVVNGAVAAAAIEVKEV

A0A5D3BDB9 Plant/F25P12-18 protein | 7.64e-120 | 96.26 | Show/hide
Query:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK
        MSLITE+IKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK
Subjt:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK

Query:  ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKEKENKEKEVVNGAVAAAAIEVKEV
        ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEE+VKVV EKENKE+ENKEKE KEKENKEK+VVNGA AAAAIEVKEV
Subjt:  ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKEKENKEKEVVNGAVAAAAIEVKEV

A0A6J1G3W7 uncharacterized protein LOC111450553 | 1.78e-87 | 75.53 | Show/hide
Query:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK
        MSL+TE IKAKADE+Y+GDE+CQ K+RELLKEMDLPNGLLPMKDMEECGI+KETGFVWLKQKKSYTHKF+DI RLVTYG EVTAYVEKNKVKKLTGVKAK
Subjt:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK

Query:  ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEV-KVVEEKENKERENKEKEKKEKENKEKEVVNGAVAAAAIEVKEV
        EL+IWL L DIYV+ PP GKITFK+TTGL RTFPVSAF+VEE+V K VE K N E               KEVV+  VAAAAIEVK++
Subjt:  ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEV-KVVEEKENKERENKEKEKKEKENKEKEVVNGAVAAAAIEVKEV

SwissProt top hits | e value | % identity | Alignment
No hits found
Arabidopsis top hits | e value | % identity | Alignment
AT1G09310.1 Protein of unknown function, DUF538 | 1.8e-46 | 57.87 | Show/hide
Query:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK
        M L+TE+++AKA E+Y GDE+C+ K++  LKE+ +PNGLLP+KD+EE G  +E+G VWLKQKKS THKF +ID+LV+YGTEVTA VE  K+KKLTGVKAK
Subjt:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK

Query:  ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKEKENKEKEVVNGAVA
        EL+IW+ + +IY  +PP  KITFK+ T LSRTFPV+AF V EE    +E+  KE   KEK  +  E KE   +  AVA
Subjt:  ELMIWLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKEKENKEKEVVNGAVA

AT1G56580.1 Protein of unknown function, DUF538 | 1.6e-44 | 58.75 | Show/hide
Query:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK
        M L+T++++A+A E Y GDE+C+ K++E LKE+ +PNGLLP+KD+EE G  +ETG VWLKQKKS THKF+ I +LV+Y TEV A VE  K+KKLTGVKAK
Subjt:  MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAK

Query:  ELMIWLPLCDIYVNQP-PNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKE
        EL+IW+ L ++ + QP  +GKI F++ TGLSRTFPVSAF V E  K   EK N   E KE
Subjt:  ELMIWLPLCDIYVNQP-PNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKE

AT4G24130.1 Protein of unknown function, DUF538 | 4.2e-32 | 46.15 | Show/hide
Query:  ELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAKELMIWLPLCDIYV
        E+ YG E C  +S ELL+E+  P G++P+K++ ECG V+ TG+VW+KQ   Y H F+  +  V+YG EVTAYV+K  +KK+TGVK+K++ +W+P+ ++ +
Subjt:  ELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAKELMIWLPLCDIYV

Query:  NQPPNGKITFKSTTGLSRTFPVSAFQVEEE
         +P + KI FK+  G+ R+FPV+ F  EEE
Subjt:  NQPPNGKITFKSTTGLSRTFPVSAFQVEEE

AT5G46230.1 Protein of unknown function, DUF538 | 2.1e-31 | 44.93 | Show/hide
Query:  TEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAKELMI
        T+  + +  E+  G+  C+ K++E+L  M+LP GLLP+ +M E G  K TG+VW+K K    H+FK I R V+Y +EVTA +E  ++ +LTG+K+KE++I
Subjt:  TEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAKELMI

Query:  WLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEE
        W+ + +I+VN     +ITF + TGLSRTFPV+AF+ +E
Subjt:  WLPLCDIYVNQPPNGKITFKSTTGLSRTFPVSAFQVEE

AT5G49600.1 Protein of unknown function, DUF538 | 2.2e-28 | 46.07 | Show/hide
Query:  LITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWL----KQKKSYTHKFKDIDR----LVTYGTEVTAYVEKNKVKKL
        ++TE +KAKA E+Y+GD+ C+ K   LL E+ LPN LL  K+++ECG VK+TGFVWL    K+K+    +++D+ R    +V +  EVTAY E N++KKL
Subjt:  LITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWL----KQKKSYTHKFKDIDR----LVTYGTEVTAYVEKNKVKKL

Query:  TGVKAKELMIWLPLCDIYVNQPPNGKITFKSTTG-LSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKE-KENKEK
        TGVKAKE M+W+ L +I VN+  +G ITFK+  G LS++ P+S F         E+    + + KEK KKE K NK K
Subjt:  TGVKAKELMIWLPLCDIYVNQPPNGKITFKSTTG-LSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKE-KENKEK


Sequences Show/hide sequences
CDS sequence | Show/hide CDS sequence
ATGTCTCTAATCACAGAAGATATCAAAGCCAAAGCTGATGAGCTCTACTATGGAGATGAGATGTGCCAAATCAAATCAAGGGAGCTGCTCAAAGAAATGGATCTTCCAAA
TGGGCTGTTGCCAATGAAAGATATGGAGGAATGTGGGATTGTGAAAGAGACGGGGTTTGTTTGGCTGAAGCAGAAGAAAAGCTACACTCATAAGTTTAAAGACATTGATA
GGTTGGTTACTTATGGCACCGAAGTTACAGCCTATGTGGAGAAAAACAAGGTTAAGAAGCTTACTGGAGTTAAGGCTAAGGAGCTCATGATTTGGCTCCCACTCTGTGAC
ATCTATGTTAATCAACCACCGAACGGGAAAATCACGTTCAAGTCTACGACTGGACTGTCAAGAACTTTCCCCGTGTCAGCCTTTCAGGTTGAAGAAGAAGTCAAGGTTGT
GGAAGAGAAGGAGAACAAAGAGAGGGAGAACAAAGAGAAGGAGAAAAAAGAGAAGGAAAACAAAGAGAAGGAAGTAGTGAACGGAGCAGTTGCAGCTGCAGCTATTGAGG
TGAAGGAGGTTTGA
mRNA sequence | Show/hide mRNA sequence
GTGTGATCAAACAAGGAAAGAAGCTCTAAACTCATAAAAAAAAAATGTCTCTAATCACAGAAGATATCAAAGCCAAAGCTGATGAGCTCTACTATGGAGATGAGATGTGC
CAAATCAAATCAAGGGAGCTGCTCAAAGAAATGGATCTTCCAAATGGGCTGTTGCCAATGAAAGATATGGAGGAATGTGGGATTGTGAAAGAGACGGGGTTTGTTTGGCT
GAAGCAGAAGAAAAGCTACACTCATAAGTTTAAAGACATTGATAGGTTGGTTACTTATGGCACCGAAGTTACAGCCTATGTGGAGAAAAACAAGGTTAAGAAGCTTACTG
GAGTTAAGGCTAAGGAGCTCATGATTTGGCTCCCACTCTGTGACATCTATGTTAATCAACCACCGAACGGGAAAATCACGTTCAAGTCTACGACTGGACTGTCAAGAACT
TTCCCCGTGTCAGCCTTTCAGGTTGAAGAAGAAGTCAAGGTTGTGGAAGAGAAGGAGAACAAAGAGAGGGAGAACAAAGAGAAGGAGAAAAAAGAGAAGGAAAACAAAGA
GAAGGAAGTAGTGAACGGAGCAGTTGCAGCTGCAGCTATTGAGGTGAAGGAGGTTTGAGTTTATTTCTTTGAAGTTACAAGGGGCTCTCTCTTCCTCTTTATTACTGGTT
TGTTGTTGGCTCAAATATGTTAGCTATATGTTCTTTTTTTTCTTTTTTTTATGTTGACAGTTTATTTTATTGAATAAACATTGGTATGAAGTTTACTTACTGTAATCGTG
TTAAACAAAGCTTTAAATGGCTTTTCTGGGCGGGGGAGGGAGATGGATGACTTTTAGCGAATGGAAATGTATTATTGTCAAATAATTTACACATAAGATGTTCAAGGAGA
GCCCACAGATCAATATTCAGGCTCTCTCTCAGTTCTAAAAAAATCTATTGCCAA
Protein sequence | Show/hide protein sequence
MSLITEDIKAKADELYYGDEMCQIKSRELLKEMDLPNGLLPMKDMEECGIVKETGFVWLKQKKSYTHKFKDIDRLVTYGTEVTAYVEKNKVKKLTGVKAKELMIWLPLCD
IYVNQPPNGKITFKSTTGLSRTFPVSAFQVEEEVKVVEEKENKERENKEKEKKEKENKEKEVVNGAVAAAAIEVKEV