; ; ; ; ; ; ; ; ; ; ; ; ; ; ; ; ; ; ; CuGenDBv2

Cucsat.G21189 (gene) of Cucumber (B10) v3 genome

Gene ID: Cucsat.G21189
Organism: Cucumis sativus L. var. sativus cv. B10 (Cucumber (B10) v3)
Description: Unknown protein
Genome location: ctg910:3285427..3291271
RNA-Seq Expression: Cucsat.G21189
Synteny: Cucsat.G21189
Gene Ontology terms: GO:0016021 - integral component of membrane (cellular component)
InterPro domains: NA


Homology Show/hide homology
GenBank top hits | e value | % identity | Alignment
XP_004143669.1 uncharacterized protein LOC101219174 [Cucumis sativus] | 6.58e-180 | 99.19 | Show/hide
Query:  MIASTPLPPWQPPLQAPFRLRRSRPLIIPYRTPIGFVQAYRRGGGGGNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVAD
        MIASTPLPPWQPPLQAPFRLRRSRPLIIPYRTPIGFVQAYRRGGGGGNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVAD
Subjt:  MIASTPLPPWQPPLQAPFRLRRSRPLIIPYRTPIGFVQAYRRGGGGGNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVAD

Query:  RAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLNEFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAG
        RAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLNEFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAG
Subjt:  RAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLNEFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAG

Query:  YKNQIISCAGCGNVVWQPKGQGEYNSRKGSSGSKSQPNVIDVEFEEK
        YKNQIISCAGCGNVVWQPK  GEYNSRKGSSGSKSQPNVIDVEFEEK
Subjt:  YKNQIISCAGCGNVVWQPKGQGEYNSRKGSSGSKSQPNVIDVEFEEK

XP_008467324.1 PREDICTED: uncharacterized protein LOC103504702 [Cucumis melo] | 4.44e-173 | 95.95 | Show/hide
Query:  MIASTPLPPWQPPLQAPFRLRRSRPLIIPYRTPIGFVQAYRRGGGGGNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVAD
        MIASTPLPPWQPPL AP RLRRSRPLIIPYRTPIGFVQAYRRGGG  NNDAFG+AWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRV SAAQSVAD
Subjt:  MIASTPLPPWQPPLQAPFRLRRSRPLIIPYRTPIGFVQAYRRGGGGGNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVAD

Query:  RAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLNEFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAG
        RAREIDREFAIG+RWRNFTLDFSRNWPRYRRQLNEFIDTPLGKS VTIFFLWFALSGWLFRFLIFGTWILPFAGPIL+GTFANSLVIKGNCPACNREFAG
Subjt:  RAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLNEFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAG

Query:  YKNQIISCAGCGNVVWQPKGQGEYNSRKGSSGSKSQPNVIDVEFEEK
        YKNQIISCAGCGN+VWQPKGQGEYNSRKGSSGSKSQPNVIDVEFEEK
Subjt:  YKNQIISCAGCGNVVWQPKGQGEYNSRKGSSGSKSQPNVIDVEFEEK

XP_022159671.1 uncharacterized protein LOC111026015 [Momordica charantia] | 1.40e-152 | 87.45 | Show/hide
Query:  MIASTPLPPWQPPLQAPFRLRRSRPLIIPYRTPIGFVQAYRRGGGGGNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVAD
        MIAST LPPWQPPLQAP RLRR RP  IP R  +GFVQAYRRG    N+D FG+AWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRV S AQS A+
Subjt:  MIASTPLPPWQPPLQAPFRLRRSRPLIIPYRTPIGFVQAYRRGGGGGNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVAD

Query:  RAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLNEFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAG
        RAREIDREF IG+RWRNFTLDFSRNWPRYRRQLNEF+DTPLGKS VTIFFLWFALSGWLFRFLIF TWILPFAGP+LIGTFANSL+IKG CPACNREFAG
Subjt:  RAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLNEFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAG

Query:  YKNQIISCAGCGNVVWQPKGQGEYNSRKGSSGSKSQPNVIDVEFEEK
        YKNQIISC+GCGN+VWQPKGQGEYNSRKG+SGSKSQPNVIDVEFEEK
Subjt:  YKNQIISCAGCGNVVWQPKGQGEYNSRKGSSGSKSQPNVIDVEFEEK

XP_022957921.1 uncharacterized protein LOC111459308 [Cucurbita moschata] | 9.45e-154 | 85.83 | Show/hide
Query:  MIASTPLPPWQPPLQAPFRLRRSRPLIIPYRTPIGFVQAYRRGGGGGNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVAD
        MIAST LPPWQPPL+AP RL R+RPL+IP R  +GFVQAYRRGGG  NND FG+ W+KVWRGANDGFEKFVFEARKTAERLDRRYSVSRRV S AQS AD
Subjt:  MIASTPLPPWQPPLQAPFRLRRSRPLIIPYRTPIGFVQAYRRGGGGGNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVAD

Query:  RAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLNEFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAG
        RAREIDREF IG+RWRNFTLDFSRNWPRYRRQLNEF+DTPLGK  VTIFFLWFALSGWLFR LIF TWILPFAGP+LIGTFANSL+IKG CPACNREFAG
Subjt:  RAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLNEFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAG

Query:  YKNQIISCAGCGNVVWQPKGQGEYNSRKGSSGSKSQPNVIDVEFEEK
        YKNQIISC GCGN+VWQPKGQGE  +RKG SGSKSQPNVIDVEFEEK
Subjt:  YKNQIISCAGCGNVVWQPKGQGEYNSRKGSSGSKSQPNVIDVEFEEK

XP_038874339.1 uncharacterized protein LOC120067037 [Benincasa hispida] | 3.60e-163 | 90.28 | Show/hide
Query:  MIASTPLPPWQPPLQAPFRLRRSRPLIIPYRTPIGFVQAYRRGGGGGNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVAD
        MIASTPLPPWQPP+QAP RLRRSR L+IPYR  IGFVQAYRRGGG  N+D FG+AWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRV S AQS AD
Subjt:  MIASTPLPPWQPPLQAPFRLRRSRPLIIPYRTPIGFVQAYRRGGGGGNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVAD

Query:  RAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLNEFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAG
        RAREIDREF IG+RWRNFTLDFSRNWPRYRRQLNEF+DTPLGKS VTIFFLWFALSGWLFRFLIF TWILPFAGP+LIG+FANSLVIKG CPACNREFAG
Subjt:  RAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLNEFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAG

Query:  YKNQIISCAGCGNVVWQPKGQGEYNSRKGSSGSKSQPNVIDVEFEEK
        YKNQIISC GCGN+VWQPKGQGEYNSRKGSSGSKSQPNVIDVEFEEK
Subjt:  YKNQIISCAGCGNVVWQPKGQGEYNSRKGSSGSKSQPNVIDVEFEEK

TrEMBL top hits | e value | % identity | Alignment
A0A0A0KPH9 Uncharacterized protein | 3.18e-180 | 99.19 | Show/hide
Query:  MIASTPLPPWQPPLQAPFRLRRSRPLIIPYRTPIGFVQAYRRGGGGGNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVAD
        MIASTPLPPWQPPLQAPFRLRRSRPLIIPYRTPIGFVQAYRRGGGGGNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVAD
Subjt:  MIASTPLPPWQPPLQAPFRLRRSRPLIIPYRTPIGFVQAYRRGGGGGNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVAD

Query:  RAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLNEFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAG
        RAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLNEFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAG
Subjt:  RAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLNEFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAG

Query:  YKNQIISCAGCGNVVWQPKGQGEYNSRKGSSGSKSQPNVIDVEFEEK
        YKNQIISCAGCGNVVWQPK  GEYNSRKGSSGSKSQPNVIDVEFEEK
Subjt:  YKNQIISCAGCGNVVWQPKGQGEYNSRKGSSGSKSQPNVIDVEFEEK

A0A1S3CT98 uncharacterized protein LOC103504702 | 2.15e-173 | 95.95 | Show/hide
Query:  MIASTPLPPWQPPLQAPFRLRRSRPLIIPYRTPIGFVQAYRRGGGGGNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVAD
        MIASTPLPPWQPPL AP RLRRSRPLIIPYRTPIGFVQAYRRGGG  NNDAFG+AWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRV SAAQSVAD
Subjt:  MIASTPLPPWQPPLQAPFRLRRSRPLIIPYRTPIGFVQAYRRGGGGGNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVAD

Query:  RAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLNEFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAG
        RAREIDREFAIG+RWRNFTLDFSRNWPRYRRQLNEFIDTPLGKS VTIFFLWFALSGWLFRFLIFGTWILPFAGPIL+GTFANSLVIKGNCPACNREFAG
Subjt:  RAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLNEFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAG

Query:  YKNQIISCAGCGNVVWQPKGQGEYNSRKGSSGSKSQPNVIDVEFEEK
        YKNQIISCAGCGN+VWQPKGQGEYNSRKGSSGSKSQPNVIDVEFEEK
Subjt:  YKNQIISCAGCGNVVWQPKGQGEYNSRKGSSGSKSQPNVIDVEFEEK

A0A6J1E4L9 uncharacterized protein LOC111026015 | 6.80e-153 | 87.45 | Show/hide
Query:  MIASTPLPPWQPPLQAPFRLRRSRPLIIPYRTPIGFVQAYRRGGGGGNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVAD
        MIAST LPPWQPPLQAP RLRR RP  IP R  +GFVQAYRRG    N+D FG+AWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRV S AQS A+
Subjt:  MIASTPLPPWQPPLQAPFRLRRSRPLIIPYRTPIGFVQAYRRGGGGGNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVAD

Query:  RAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLNEFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAG
        RAREIDREF IG+RWRNFTLDFSRNWPRYRRQLNEF+DTPLGKS VTIFFLWFALSGWLFRFLIF TWILPFAGP+LIGTFANSL+IKG CPACNREFAG
Subjt:  RAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLNEFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAG

Query:  YKNQIISCAGCGNVVWQPKGQGEYNSRKGSSGSKSQPNVIDVEFEEK
        YKNQIISC+GCGN+VWQPKGQGEYNSRKG+SGSKSQPNVIDVEFEEK
Subjt:  YKNQIISCAGCGNVVWQPKGQGEYNSRKGSSGSKSQPNVIDVEFEEK

A0A6J1H0K1 uncharacterized protein LOC111459308 | 4.57e-154 | 85.83 | Show/hide
Query:  MIASTPLPPWQPPLQAPFRLRRSRPLIIPYRTPIGFVQAYRRGGGGGNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVAD
        MIAST LPPWQPPL+AP RL R+RPL+IP R  +GFVQAYRRGGG  NND FG+ W+KVWRGANDGFEKFVFEARKTAERLDRRYSVSRRV S AQS AD
Subjt:  MIASTPLPPWQPPLQAPFRLRRSRPLIIPYRTPIGFVQAYRRGGGGGNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVAD

Query:  RAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLNEFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAG
        RAREIDREF IG+RWRNFTLDFSRNWPRYRRQLNEF+DTPLGK  VTIFFLWFALSGWLFR LIF TWILPFAGP+LIGTFANSL+IKG CPACNREFAG
Subjt:  RAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLNEFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAG

Query:  YKNQIISCAGCGNVVWQPKGQGEYNSRKGSSGSKSQPNVIDVEFEEK
        YKNQIISC GCGN+VWQPKGQGE  +RKG SGSKSQPNVIDVEFEEK
Subjt:  YKNQIISCAGCGNVVWQPKGQGEYNSRKGSSGSKSQPNVIDVEFEEK

A0A6J1K7K5 uncharacterized protein LOC111491357 | 2.17e-152 | 85.02 | Show/hide
Query:  MIASTPLPPWQPPLQAPFRLRRSRPLIIPYRTPIGFVQAYRRGGGGGNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVAD
        MIAST LPPWQP L+AP RL R+RPL+IP R  +GFVQAYRRGGG  NND FG+ W+KVWRGANDGFEKFVFEARKTAERLDRRYSVSRRV S AQS AD
Subjt:  MIASTPLPPWQPPLQAPFRLRRSRPLIIPYRTPIGFVQAYRRGGGGGNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVAD

Query:  RAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLNEFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAG
        RAREIDREF IG+RWRNFTLDFSRNWPRYRRQLN+F+DTPLGK  VTIFFLWFALSGWLFR LIF TWILPFAGP+LIGTFANSL+IKG CPACNREFAG
Subjt:  RAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLNEFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAG

Query:  YKNQIISCAGCGNVVWQPKGQGEYNSRKGSSGSKSQPNVIDVEFEEK
        YKNQIISC GCGN+VWQPKGQGE  +RKG SGSKSQPNVIDVEFEEK
Subjt:  YKNQIISCAGCGNVVWQPKGQGEYNSRKGSSGSKSQPNVIDVEFEEK

SwissProt top hits | e value | % identity | Alignment
No hits found
Arabidopsis top hits | e value | % identity | Alignment
AT2G44870.1 unknown protein | 7.9e-71 | 59.46 | Show/hide
Query:  VQAYRRGGGG--GNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVADRAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLN
        V+A++RG      +N   G AW   WR ANDGFE+FVFEA+KTAER+DR+Y+VSRR  SAA S ADRAREIDREF I  R R  + DFSRN+P+YR+Q +
Subjt:  VQAYRRGGGG--GNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVADRAREIDREFAIGMRWRNFTLDFSRNWPRYRRQLN

Query:  EFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAGYKNQIISCAGCGNVVWQPKG---------QGEYN
         F++TPLG S  TIFFLWFALSGWLFR +I  TW+LP AGP+LIG  AN+ VIKG CPAC R+F GYKNQII C GCGN+VWQP+G             N
Subjt:  EFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAGYKNQIISCAGCGNVVWQPKG---------QGEYN

Query:  SRKGSSGSKSQPNVIDVEFEEK
        + KG+S    +  +IDV+FEEK
Subjt:  SRKGSSGSKSQPNVIDVEFEEK


Sequences Show/hide sequences
CDS sequence | Show/hide CDS sequence
ATGATAGCTTCAACACCTCTGCCGCCATGGCAGCCACCGCTTCAAGCTCCATTCAGATTGAGGAGGAGTAGGCCTTTAATAATCCCTTACCGGACCCCTATTGGCTTCGT
TCAGGCATACCGTCGCGGGGGCGGCGGCGGAAACAACGACGCTTTTGGCGACGCCTGGAACAAAGTATGGCGAGGCGCCAACGATGGGTTTGAGAAATTCGTATTCGAGG
CCAGGAAAACTGCGGAGCGTCTTGATAGGCGTTACTCTGTATCGCGCCGTGTTGGTTCTGCTGCTCAATCGGTGGCCGACCGGGCGCGCGAGATTGATAGGGAGTTTGCA
ATTGGAATGCGTTGGCGTAATTTTACATTGGATTTTAGCAGAAATTGGCCAAGGTATAGGAGGCAACTCAATGAGTTTATCGACACGCCATTAGGAAAAAGTGTTGTGAC
AATATTCTTCCTTTGGTTTGCTTTGTCTGGATGGCTTTTCCGGTTCTTGATATTTGGAACGTGGATACTACCATTTGCTGGTCCAATACTCATTGGGACTTTTGCCAATA
GCCTTGTAATAAAGGGTAATTGTCCAGCCTGTAATAGAGAATTTGCTGGGTACAAGAACCAAATTATTTCTTGCGCAGGATGTGGAAACGTAGTGTGGCAGCCCAAAGGC
CAAGGGGAATACAATTCAAGAAAAGGAAGTTCTGGTTCCAAGTCACAACCCAATGTCATTGATGTGGAGTTTGAGGAGAAATGA
mRNA sequence | Show/hide mRNA sequence
ATGATAGCTTCAACACCTCTGCCGCCATGGCAGCCACCGCTTCAAGCTCCATTCAGATTGAGGAGGAGTAGGCCTTTAATAATCCCTTACCGGACCCCTATTGGCTTCGT
TCAGGCATACCGTCGCGGGGGCGGCGGCGGAAACAACGACGCTTTTGGCGACGCCTGGAACAAAGTATGGCGAGGCGCCAACGATGGGTTTGAGAAATTCGTATTCGAGG
CCAGGAAAACTGCGGAGCGTCTTGATAGGCGTTACTCTGTATCGCGCCGTGTTGGTTCTGCTGCTCAATCGGTGGCCGACCGGGCGCGCGAGATTGATAGGGAGTTTGCA
ATTGGAATGCGTTGGCGTAATTTTACATTGGATTTTAGCAGAAATTGGCCAAGGTATAGGAGGCAACTCAATGAGTTTATCGACACGCCATTAGGAAAAAGTGTTGTGAC
AATATTCTTCCTTTGGTTTGCTTTGTCTGGATGGCTTTTCCGGTTCTTGATATTTGGAACGTGGATACTACCATTTGCTGGTCCAATACTCATTGGGACTTTTGCCAATA
GCCTTGTAATAAAGGGTAATTGTCCAGCCTGTAATAGAGAATTTGCTGGGTACAAGAACCAAATTATTTCTTGCGCAGGATGTGGAAACGTAGTGTGGCAGCCCAAAGGC
CAAGGGGAATACAATTCAAGAAAAGGAAGTTCTGGTTCCAAGTCACAACCCAATGTCATTGATGTGGAGTTTGAGGAGAAATGA
Protein sequence | Show/hide protein sequence
MIASTPLPPWQPPLQAPFRLRRSRPLIIPYRTPIGFVQAYRRGGGGGNNDAFGDAWNKVWRGANDGFEKFVFEARKTAERLDRRYSVSRRVGSAAQSVADRAREIDREFA
IGMRWRNFTLDFSRNWPRYRRQLNEFIDTPLGKSVVTIFFLWFALSGWLFRFLIFGTWILPFAGPILIGTFANSLVIKGNCPACNREFAGYKNQIISCAGCGNVVWQPKG
QGEYNSRKGSSGSKSQPNVIDVEFEEK