CuGenDBv2

Tan0014917 (gene) of Snake gourd v1 genome

Gene ID: Tan0014917
Organism: Trichosanthes anguina (Snake gourd v1)
Description: protein COFACTOR ASSEMBLY OF COMPLEX C SUBUNIT B CCB2, chloroplastic
Genome location: LG01:2433542..2436527
RNA-Seq Expression: Tan0014917
Synteny: Tan0014917
Gene Ontology terms: GO:0010190 - cytochrome b6f complex assembly (biological process)
InterPro domains: IPR021325 - Cofactor assembly of complex C subunit B, CCB2/CCB4
IPR044970 - COFACTOR ASSEMBLY OF COMPLEX C SUBUNIT B CCB2, chloroplastic


Homology Show/hide homology
GenBank top hits | e value | % identity | Alignment
XP_022141087.1 protein COFACTOR ASSEMBLY OF COMPLEX C SUBUNIT B CCB2, chloroplastic isoform X1 [Momordica charantia] | 5.4e-105 | 89.04 | Show/hide
Query:  MTSTILSSSPLIWLSSTPRFGAKSRLKSPAISARLDDSKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEG
        MT +ILS +PLI L+STPRF AK+RLK+PA+SARLDDSKNS NQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHF GSNSAAP TPAQLRTE 
Subjt:  MTSTILSSSPLIWLSSTPRFGAKSRLKSPAISARLDDSKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEG

Query:  LGISLAAFSIALPYLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQ
        LG+SLAAFSIALPYLG+FLKGAVPSGEA+LPEG EQIFV+SQNVSDNVKEDLAWATYILLRNTNSISVLI+I+GELCVRGYWNSPNDI GADL+AWFEEQ
Subjt:  LGISLAAFSIALPYLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQ

Query:  LQSIGLSALNDALYFPQIS
        LQSIGLSALND LYFPQIS
Subjt:  LQSIGLSALNDALYFPQIS

XP_022141092.1 protein COFACTOR ASSEMBLY OF COMPLEX C SUBUNIT B CCB2, chloroplastic isoform X3 [Momordica charantia] | 1.1e-105 | 89.09 | Show/hide
Query:  MTSTILSSSPLIWLSSTPRFGAKSRLKSPAISARLDDSKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEG
        MT +ILS +PLI L+STPRF AK+RLK+PA+SARLDDSKNS NQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHF GSNSAAP TPAQLRTE 
Subjt:  MTSTILSSSPLIWLSSTPRFGAKSRLKSPAISARLDDSKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEG

Query:  LGISLAAFSIALPYLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQ
        LG+SLAAFSIALPYLG+FLKGAVPSGEA+LPEG EQIFV+SQNVSDNVKEDLAWATYILLRNTNSISVLI+I+GELCVRGYWNSPNDI GADL+AWFEEQ
Subjt:  LGISLAAFSIALPYLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQ

Query:  LQSIGLSALNDALYFPQISG
        LQSIGLSALND LYFPQISG
Subjt:  LQSIGLSALNDALYFPQISG

XP_022968386.1 protein COFACTOR ASSEMBLY OF COMPLEX C SUBUNIT B CCB2, chloroplastic isoform X1 [Cucurbita maxima] | 5.9e-104 | 89.95 | Show/hide
Query:  MTSTILSSSPLIWLSSTPRFGAKSRLKSPAISARLDDSKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEG
        M+ TILS  PLI LSSTPRF AK+  KSP I+ARLDDSKNS N+QLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGS+SAAPIT AQLRTE 
Subjt:  MTSTILSSSPLIWLSSTPRFGAKSRLKSPAISARLDDSKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEG

Query:  LGISLAAFSIALPYLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQ
        LGISLAAFSIALPYLG+FL+GAVPSGEATLPEGAEQIFV+SQNVSDNVK+DLAWATYILLRNTNSISVLI IQGELCVRGYWNSPNDISGADLLAWFEEQ
Subjt:  LGISLAAFSIALPYLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQ

Query:  LQSIGLSALNDALYFPQIS
        LQSIGLSALND+LYFPQIS
Subjt:  LQSIGLSALNDALYFPQIS

XP_022968395.1 protein COFACTOR ASSEMBLY OF COMPLEX C SUBUNIT B CCB2, chloroplastic isoform X2 [Cucurbita maxima] | 5.9e-104 | 89.95 | Show/hide
Query:  MTSTILSSSPLIWLSSTPRFGAKSRLKSPAISARLDDSKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEG
        M+ TILS  PLI LSSTPRF AK+  KSP I+ARLDDSKNS N+QLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGS+SAAPIT AQLRTE 
Subjt:  MTSTILSSSPLIWLSSTPRFGAKSRLKSPAISARLDDSKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEG

Query:  LGISLAAFSIALPYLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQ
        LGISLAAFSIALPYLG+FL+GAVPSGEATLPEGAEQIFV+SQNVSDNVK+DLAWATYILLRNTNSISVLI IQGELCVRGYWNSPNDISGADLLAWFEEQ
Subjt:  LGISLAAFSIALPYLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQ

Query:  LQSIGLSALNDALYFPQIS
        LQSIGLSALND+LYFPQIS
Subjt:  LQSIGLSALNDALYFPQIS

XP_023542853.1 protein COFACTOR ASSEMBLY OF COMPLEX C SUBUNIT B CCB2, chloroplastic [Cucurbita pepo subsp. pepo] | 1.0e-103 | 89.95 | Show/hide
Query:  MTSTILSSSPLIWLSSTPRFGAKSRLKSPAISARLDDSKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEG
        M+ TILS  PLI LSST RF AK+  KSP I+ARLDDSKNS N+QLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPIT AQLRTE 
Subjt:  MTSTILSSSPLIWLSSTPRFGAKSRLKSPAISARLDDSKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEG

Query:  LGISLAAFSIALPYLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQ
        LGISLAAFSIALPYLG+FL+GAVPSGEATLPEGAEQIFV+SQNVSDNVK+DLAWATYILLRNTNSISVLI+IQGELCVRGYWNSPNDISG DLLAWFEEQ
Subjt:  LGISLAAFSIALPYLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQ

Query:  LQSIGLSALNDALYFPQIS
        LQSIGLSALNDALYFPQIS
Subjt:  LQSIGLSALNDALYFPQIS

TrEMBL top hits | e value | % identity | Alignment
A0A6J1CIW2 protein COFACTOR ASSEMBLY OF COMPLEX C SUBUNIT B CCB2, chloroplastic isoform X3 | 5.2e-106 | 89.09 | Show/hide
Query:  MTSTILSSSPLIWLSSTPRFGAKSRLKSPAISARLDDSKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEG
        MT +ILS +PLI L+STPRF AK+RLK+PA+SARLDDSKNS NQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHF GSNSAAP TPAQLRTE 
Subjt:  MTSTILSSSPLIWLSSTPRFGAKSRLKSPAISARLDDSKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEG

Query:  LGISLAAFSIALPYLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQ
        LG+SLAAFSIALPYLG+FLKGAVPSGEA+LPEG EQIFV+SQNVSDNVKEDLAWATYILLRNTNSISVLI+I+GELCVRGYWNSPNDI GADL+AWFEEQ
Subjt:  LGISLAAFSIALPYLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQ

Query:  LQSIGLSALNDALYFPQISG
        LQSIGLSALND LYFPQISG
Subjt:  LQSIGLSALNDALYFPQISG

A0A6J1CJH9 protein COFACTOR ASSEMBLY OF COMPLEX C SUBUNIT B CCB2, chloroplastic isoform X1 | 2.6e-105 | 89.04 | Show/hide
Query:  MTSTILSSSPLIWLSSTPRFGAKSRLKSPAISARLDDSKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEG
        MT +ILS +PLI L+STPRF AK+RLK+PA+SARLDDSKNS NQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHF GSNSAAP TPAQLRTE 
Subjt:  MTSTILSSSPLIWLSSTPRFGAKSRLKSPAISARLDDSKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEG

Query:  LGISLAAFSIALPYLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQ
        LG+SLAAFSIALPYLG+FLKGAVPSGEA+LPEG EQIFV+SQNVSDNVKEDLAWATYILLRNTNSISVLI+I+GELCVRGYWNSPNDI GADL+AWFEEQ
Subjt:  LGISLAAFSIALPYLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQ

Query:  LQSIGLSALNDALYFPQIS
        LQSIGLSALND LYFPQIS
Subjt:  LQSIGLSALNDALYFPQIS

A0A6J1G0N4 protein COFACTOR ASSEMBLY OF COMPLEX C SUBUNIT B CCB2, chloroplastic | 8.3e-104 | 89.5 | Show/hide
Query:  MTSTILSSSPLIWLSSTPRFGAKSRLKSPAISARLDDSKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEG
        M+ TILS  PLI LSSTPRF AK+  KSP I+ARLDDSKNS ++QLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGS+SAAPIT AQLRTE 
Subjt:  MTSTILSSSPLIWLSSTPRFGAKSRLKSPAISARLDDSKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEG

Query:  LGISLAAFSIALPYLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQ
        LGISLAAFSIALPYLG+FL+GAVPSGEATLPEGAEQIFV+SQ+VSDNVK+DLAWATYILLRNTNSISVLI+IQGELCVRGYWNSPNDISGADLLAWFEEQ
Subjt:  LGISLAAFSIALPYLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQ

Query:  LQSIGLSALNDALYFPQIS
        LQSIGLSALNDALYFPQIS
Subjt:  LQSIGLSALNDALYFPQIS

A0A6J1HX31 protein COFACTOR ASSEMBLY OF COMPLEX C SUBUNIT B CCB2, chloroplastic isoform X2 | 2.9e-104 | 89.95 | Show/hide
Query:  MTSTILSSSPLIWLSSTPRFGAKSRLKSPAISARLDDSKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEG
        M+ TILS  PLI LSSTPRF AK+  KSP I+ARLDDSKNS N+QLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGS+SAAPIT AQLRTE 
Subjt:  MTSTILSSSPLIWLSSTPRFGAKSRLKSPAISARLDDSKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEG

Query:  LGISLAAFSIALPYLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQ
        LGISLAAFSIALPYLG+FL+GAVPSGEATLPEGAEQIFV+SQNVSDNVK+DLAWATYILLRNTNSISVLI IQGELCVRGYWNSPNDISGADLLAWFEEQ
Subjt:  LGISLAAFSIALPYLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQ

Query:  LQSIGLSALNDALYFPQIS
        LQSIGLSALND+LYFPQIS
Subjt:  LQSIGLSALNDALYFPQIS

A0A6J1HXW3 protein COFACTOR ASSEMBLY OF COMPLEX C SUBUNIT B CCB2, chloroplastic isoform X1 | 2.9e-104 | 89.95 | Show/hide
Query:  MTSTILSSSPLIWLSSTPRFGAKSRLKSPAISARLDDSKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEG
        M+ TILS  PLI LSSTPRF AK+  KSP I+ARLDDSKNS N+QLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGS+SAAPIT AQLRTE 
Subjt:  MTSTILSSSPLIWLSSTPRFGAKSRLKSPAISARLDDSKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEG

Query:  LGISLAAFSIALPYLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQ
        LGISLAAFSIALPYLG+FL+GAVPSGEATLPEGAEQIFV+SQNVSDNVK+DLAWATYILLRNTNSISVLI IQGELCVRGYWNSPNDISGADLLAWFEEQ
Subjt:  LGISLAAFSIALPYLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQ

Query:  LQSIGLSALNDALYFPQIS
        LQSIGLSALND+LYFPQIS
Subjt:  LQSIGLSALNDALYFPQIS

SwissProt top hits | e value | % identity | Alignment
Q9FJ81 Protein COFACTOR ASSEMBLY OF COMPLEX C SUBUNIT B CCB2, chloroplastic | 1.5e-65 | 59.42 | Show/hide
Query:  PRFGAKSRL-KSPAISARLDD---SKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEGLGISLAAFSIALP
        P+F  + R  +S  I AR ++      + +QQLNLSVLRFT GIPG DESYLPRWIGYGFGSLLLLNHF   +++API+ +Q+R+E LG+SLAAFSIALP
Subjt:  PRFGAKSRL-KSPAISARLDD---SKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEGLGISLAAFSIALP

Query:  YLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQLQSIGLSALNDAL
        Y+G+FLKG+V   + +LPE  EQ+FV+S N+ D++KEDLAWATY+LLRNT++I+VLI +QGELCVRGYWN P+ +S A L  WF++++  IGL+ + + L
Subjt:  YLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQLQSIGLSALNDAL

Query:  YFPQISG
        YFPQ +G
Subjt:  YFPQISG

Arabidopsis top hits | e value | % identity | Alignment
AT5G52110.1 Protein of unknown function (DUF2930) | 1.1e-66 | 59.42 | Show/hide
Query:  PRFGAKSRL-KSPAISARLDD---SKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEGLGISLAAFSIALP
        P+F  + R  +S  I AR ++      + +QQLNLSVLRFT GIPG DESYLPRWIGYGFGSLLLLNHF   +++API+ +Q+R+E LG+SLAAFSIALP
Subjt:  PRFGAKSRL-KSPAISARLDD---SKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEGLGISLAAFSIALP

Query:  YLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQLQSIGLSALNDAL
        Y+G+FLKG+V   + +LPE  EQ+FV+S N+ D++KEDLAWATY+LLRNT++I+VLI +QGELCVRGYWN P+ +S A L  WF++++  IGL+ + + L
Subjt:  YLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQLQSIGLSALNDAL

Query:  YFPQISG
        YFPQ +G
Subjt:  YFPQISG

AT5G52110.2 Protein of unknown function (DUF2930) | 1.1e-66 | 59.42 | Show/hide
Query:  PRFGAKSRL-KSPAISARLDD---SKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEGLGISLAAFSIALP
        P+F  + R  +S  I AR ++      + +QQLNLSVLRFT GIPG DESYLPRWIGYGFGSLLLLNHF   +++API+ +Q+R+E LG+SLAAFSIALP
Subjt:  PRFGAKSRL-KSPAISARLDD---SKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEGLGISLAAFSIALP

Query:  YLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQLQSIGLSALNDAL
        Y+G+FLKG+V   + +LPE  EQ+FV+S N+ D++KEDLAWATY+LLRNT++I+VLI +QGELCVRGYWN P+ +S A L  WF++++  IGL+ + + L
Subjt:  YLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQLQSIGLSALNDAL

Query:  YFPQISG
        YFPQ +G
Subjt:  YFPQISG


Sequences Show/hide sequences
CDS sequence (Show/hide CDS sequence)
ATGACCAGCACAATTCTCTCTTCCAGCCCGTTAATTTGGTTGTCATCCACTCCCCGATTTGGCGCTAAAAGTAGGTTGAAGAGTCCAGCAATTTCTGCTCGTCTTGACGA
TTCTAAGAACTCGGGCAATCAGCAACTCAATCTCTCTGTCCTTCGCTTCACACTCGGGATTCCTGGATTGGATGAGTCTTACTTACCCAGATGGATTGGTTATGGATTTG
GTTCGCTTCTGCTTTTGAATCACTTTGTTGGTTCGAATTCAGCTGCTCCCATCACCCCGGCACAGCTAAGAACTGAGGGTTTAGGCATTTCGTTGGCAGCATTTTCTATT
GCACTCCCCTACTTGGGAAGGTTTCTTAAGGGTGCAGTTCCATCTGGTGAAGCTACCCTCCCTGAAGGTGCTGAGCAAATATTTGTCATGTCACAAAATGTGTCGGATAA
TGTGAAGGAAGACTTGGCTTGGGCAACATACATCTTGCTACGCAATACAAACAGTATATCAGTGTTAATAAAGATTCAAGGAGAGTTATGTGTTCGAGGATACTGGAATA
GTCCAAATGATATATCAGGAGCAGATTTACTTGCCTGGTTTGAGGAGCAGCTTCAAAGCATTGGCCTGTCTGCATTAAATGATGCCCTCTATTTTCCTCAGATTTCAGGT
ATATGA
mRNA sequence (Show/hide mRNA sequence)
AAAAGCTTCAATTAAGGAAAAAAAAAAAAGAGAACGGATTTGGATGTGGATCAAGCAGGGAAGTGTCCGGCCCATTGATCTTGCAGTAGAATTTAGAGAATTTTCTCGAT
TGCCATACAAGGAAAGAACATGACCAGCACAATTCTCTCTTCCAGCCCGTTAATTTGGTTGTCATCCACTCCCCGATTTGGCGCTAAAAGTAGGTTGAAGAGTCCAGCAA
TTTCTGCTCGTCTTGACGATTCTAAGAACTCGGGCAATCAGCAACTCAATCTCTCTGTCCTTCGCTTCACACTCGGGATTCCTGGATTGGATGAGTCTTACTTACCCAGA
TGGATTGGTTATGGATTTGGTTCGCTTCTGCTTTTGAATCACTTTGTTGGTTCGAATTCAGCTGCTCCCATCACCCCGGCACAGCTAAGAACTGAGGGTTTAGGCATTTC
GTTGGCAGCATTTTCTATTGCACTCCCCTACTTGGGAAGGTTTCTTAAGGGTGCAGTTCCATCTGGTGAAGCTACCCTCCCTGAAGGTGCTGAGCAAATATTTGTCATGT
CACAAAATGTGTCGGATAATGTGAAGGAAGACTTGGCTTGGGCAACATACATCTTGCTACGCAATACAAACAGTATATCAGTGTTAATAAAGATTCAAGGAGAGTTATGT
GTTCGAGGATACTGGAATAGTCCAAATGATATATCAGGAGCAGATTTACTTGCCTGGTTTGAGGAGCAGCTTCAAAGCATTGGCCTGTCTGCATTAAATGATGCCCTCTA
TTTTCCTCAGATTTCAGGTATATGATTGCATTTTCCATGAACGTCTTTTTTACTCTCTTGATGCACATGAAATAATGTCTTAGAAACGACCATAATTAGTGGAGAAAATG
TTGTTATCTCCTTAAAAATTCGCTTATGGCCACAAATGGAGTAATTAGATAAAATAGGTTGAAGATCAGTAGTTGTAACTTTGAATTTCTATATTATGTTTAAAGTTAGA
ATGATAGACCACTGATAGCAATAGTACATGTGTACTAGAAGAAATGAAGAATGTAAAGGGGGCGGCCTAGAGCATGGGATCTTGTAGTACTCTAAAGGACTTAGGGTTTG
ATTATCAACCGCTATCAAAACTTGAAGTAATCTGCAATGTCATATAAATATTGGTTTCTTTTCCTTATGGTGATGAGGTGCTTCTCTTGGTTCTTTCTCTGATTAAACAT
GCACTGATGGTAATAGATAGTTAAACAAATACTATGGTGTTTTATGAAACTGTTAGGAATCCTCTGGTTTCCCTGTATAAACACACAGAAAAACACCCAAACGACACTG
Protein sequence (Show/hide protein sequence)
MTSTILSSSPLIWLSSTPRFGAKSRLKSPAISARLDDSKNSGNQQLNLSVLRFTLGIPGLDESYLPRWIGYGFGSLLLLNHFVGSNSAAPITPAQLRTEGLGISLAAFSI
ALPYLGRFLKGAVPSGEATLPEGAEQIFVMSQNVSDNVKEDLAWATYILLRNTNSISVLIKIQGELCVRGYWNSPNDISGADLLAWFEEQLQSIGLSALNDALYFPQISG
I