CuGenDBv2

Cmc08g0225851 (gene) of Melon (Charmono) v1.1 genome

Gene ID: Cmc08g0225851
Organism: Cucumis melo var. cantalupensis cv. Charmono (Melon (Charmono) v1.1)
Description: Gag/pol protein
Genome location: CMiso1.1chr08:17176828..17177844
RNA-Seq Expression: Cmc08g0225851
Synteny: Cmc08g0225851
Gene Ontology terms: GO:0006508 - proteolysis (biological process)
GO:0015074 - DNA integration (biological process)
GO:0003676 - nucleic acid binding (molecular function)
GO:0008234 - cysteine-type peptidase activity (molecular function)
GO:0008270 - zinc ion binding (molecular function)
InterPro domains: IPR013103 - Reverse transcriptase, RNA-dependent DNA polymerase
IPR043502 - DNA/RNA polymerase superfamily


Homology Show/hide homology
GenBank top hits | e value | %identity | Alignment
ADJ18449.1 gag/pol protein, partial [Bryonia dioica] | 6.2e-161 | 84.64 | Show/hide
Query:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLE
        MESMY NSVWTLVD  +DVKPIGCKWIYKRKRDQAGKVQTFKARLV KGYTQKEG++Y ETFSPVAM+KSIRILLSI TFY+YEIWQMDVKTAFLN +LE
Subjt:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLE

Query:  ESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQFQ
        ESIYMVQPEGFI + QEQ VCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYK+I+NS VAFL++YVDDILLIGNDV +LTD+KKWL TQFQ
Subjt:  ESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQFQ

Query:  MKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSVG
        MKDLG AQY+LGIQIVRNRKNKTLAMSQ SYIDK+LSRYKMQNSKKG LP+ +GIHLSKEQCPKTPQEVEDM NI Y+ A+GSLMYAMLCT PDICYSVG
Subjt:  MKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSVG

Query:  IVSRYQSNLGRDHWTVVKNILNILEEQKTTCL
        IVSRYQSN GRDHWT VKNIL  L   +   L
Subjt:  IVSRYQSNLGRDHWTVVKNILNILEEQKTTCL

KAA0025945.1 gag/pol protein [Cucumis melo var. makuwa] | 4.9e-150 | 79.88 | Show/hide
Query:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLE
        MESMY NSVW LVD    VKPIGCKWIYKRKRD AGKVQTFKARLV KGYTQ+EG++Y ETFSPVAM+KSIRILLSI TFYDYEIWQMDVKTAFLN +LE
Subjt:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLE

Query:  ESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQFQ
        ESI+M QPEGFI +GQEQ VCKL +SIYGLKQASRSWNIRFDTAIKSYGF+QNVDEPCVYK+I    VAFLV+YVDDILLIGNDVG+LTD+K WLA QFQ
Subjt:  ESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQFQ

Query:  MKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSVG
        MKDLG AQYVLGIQI+R+RKNKTLA+SQ +YIDK+L RY MQNSKKGLLP+ +G+HLSKEQ PKTPQEVEDM  I YA A+GSLMYAMLCT PDICY+VG
Subjt:  MKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSVG

Query:  IVSRYQSNLGRDHWTVVKNILNILEEQK
        IVSRYQSN G DHWT VK +L  L   +
Subjt:  IVSRYQSNLGRDHWTVVKNILNILEEQK

KAA0045356.1 gag/pol protein [Cucumis melo var. makuwa] | 3.2e-157 | 90.2 | Show/hide
Query:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLE
        MESMYSNSVWTLVDQ N+++PIGCKWIYKRKRDQ  KVQTF+ARLV KGYTQKEGI+Y ETFSP+AMIKSIRILLSI TFYDYEIWQMDVKTAFLN +LE
Subjt:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLE

Query:  ESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQFQ
        ESIYMVQPEGFIQKGQEQ VCKLQKSIYGLKQASRSWNIRFDT IKSYGFEQNVDEPCVYKRIINSTVAFLV+YVDDILLIGN+V HLTDIK+WL TQFQ
Subjt:  ESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQFQ

Query:  MKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSVG
        MKDLG+AQYVLGIQIV+NRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPY YGIHLSKEQCPKTPQEV+DMSNI YA A+GSLMYAMLC  PDICYSVG
Subjt:  MKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSVG

Query:  IVSRYQ
        IVSRYQ
Subjt:  IVSRYQ

KAA0059226.1 gag/pol protein [Cucumis melo var. makuwa] | 4.9e-150 | 79.88 | Show/hide
Query:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLE
        MESMY NSVW LVD    VKPIGCKWIYKRKRD AGKVQTFKARLV KGYTQ+EG++Y ETFSPVAM+KSIRILLSI TFYDYEIWQMDVKTAFLN +LE
Subjt:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLE

Query:  ESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQFQ
        ESI+M QPEGFI +GQEQ VCKL +SIYGLKQASRSWNIRFDTAIKSYGF+QNVDEPCVYK+I    VAFLV+YVDDILLIGNDVG+LTD+K WLA QFQ
Subjt:  ESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQFQ

Query:  MKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSVG
        MKDLG AQYVLGIQI+R+RKNKTLA+SQ +YIDK+L RY MQNSKKGLLP+ +G+HLSKEQ PKTPQEVEDM  I YA A+GSLMYAMLCT PDICY+VG
Subjt:  MKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSVG

Query:  IVSRYQSNLGRDHWTVVKNILNILEEQK
        IVSRYQSN G DHWT VK +L  L   +
Subjt:  IVSRYQSNLGRDHWTVVKNILNILEEQK

TYK03644.1 gag/pol protein [Cucumis melo var. makuwa] | 3.3e-162 | 88.41 | Show/hide
Query:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLE
        MESMYSNSVWTLVDQ NDVKPIGCKWIYKRKRDQAGKVQTFKARLV KGYTQKEGI+Y E FS  AMIKSIRILLSI TFYDYEIWQMDVKT FLN +LE
Subjt:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLE

Query:  ESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQFQ
        ESIYMVQPE FIQKGQEQ +CKLQKSIYGLKQASRS NIRFDTAIKSYG EQNVDEPCVYKRI+NSTVAFLV+YVDDILLIGNDVGHL DIKKWLA QFQ
Subjt:  ESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQFQ

Query:  MKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSVG
        MKDLGNAQYVLG+QIVRNRKNKTLAMSQTSYIDKMLSRYKM NSKKGLLPY YGIHLSKEQCPKTPQEVEDMSNI YA A+GSLMY MLCT P+ICYSVG
Subjt:  MKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSVG

Query:  IVSRYQSNLGRDHWTVVKNILNILEEQK
        IVSR QS  GRDHWT VKNIL  L   K
Subjt:  IVSRYQSNLGRDHWTVVKNILNILEEQK

TrEMBL top hits | e value | %identity | Alignment
A0A5A7TTA2 Gag/pol protein | 1.5e-157 | 90.2 | Show/hide
Query:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLE
        MESMYSNSVWTLVDQ N+++PIGCKWIYKRKRDQ  KVQTF+ARLV KGYTQKEGI+Y ETFSP+AMIKSIRILLSI TFYDYEIWQMDVKTAFLN +LE
Subjt:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLE

Query:  ESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQFQ
        ESIYMVQPEGFIQKGQEQ VCKLQKSIYGLKQASRSWNIRFDT IKSYGFEQNVDEPCVYKRIINSTVAFLV+YVDDILLIGN+V HLTDIK+WL TQFQ
Subjt:  ESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQFQ

Query:  MKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSVG
        MKDLG+AQYVLGIQIV+NRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPY YGIHLSKEQCPKTPQEV+DMSNI YA A+GSLMYAMLC  PDICYSVG
Subjt:  MKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSVG

Query:  IVSRYQ
        IVSRYQ
Subjt:  IVSRYQ

A0A5A7TZD0 Gag/pol protein | 2.4e-150 | 79.88 | Show/hide
Query:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLE
        MESMY NSVW LVD    VKPIGCKWIYKRKRD AGKVQTFKARLV KGYTQ+EG++Y ETFSPVAM+KSIRILLSI TFYDYEIWQMDVKTAFLN +LE
Subjt:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLE

Query:  ESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQFQ
        ESI+M QPEGFI +GQEQ VCKL +SIYGLKQASRSWNIRFDTAIKSYGF+QNVDEPCVYK+I    VAFLV+YVDDILLIGNDVG+LTD+K WLA QFQ
Subjt:  ESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQFQ

Query:  MKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSVG
        MKDLG AQYVLGIQI+R+RKNKTLA+SQ +YIDK+L RY MQNSKKGLLP+ +G+HLSKEQ PKTPQEVEDM  I YA A+GSLMYAMLCT PDICY+VG
Subjt:  MKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSVG

Query:  IVSRYQSNLGRDHWTVVKNILNILEEQK
        IVSRYQSN G DHWT VK +L  L   +
Subjt:  IVSRYQSNLGRDHWTVVKNILNILEEQK

A0A5A7UYE8 Gag/pol protein | 2.4e-150 | 79.88 | Show/hide
Query:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLE
        MESMY NSVW LVD    VKPIGCKWIYKRKRD AGKVQTFKARLV KGYTQ+EG++Y ETFSPVAM+KSIRILLSI TFYDYEIWQMDVKTAFLN +LE
Subjt:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLE

Query:  ESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQFQ
        ESI+M QPEGFI +GQEQ VCKL +SIYGLKQASRSWNIRFDTAIKSYGF+QNVDEPCVYK+I    VAFLV+YVDDILLIGNDVG+LTD+K WLA QFQ
Subjt:  ESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQFQ

Query:  MKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSVG
        MKDLG AQYVLGIQI+R+RKNKTLA+SQ +YIDK+L RY MQNSKKGLLP+ +G+HLSKEQ PKTPQEVEDM  I YA A+GSLMYAMLCT PDICY+VG
Subjt:  MKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSVG

Query:  IVSRYQSNLGRDHWTVVKNILNILEEQK
        IVSRYQSN G DHWT VK +L  L   +
Subjt:  IVSRYQSNLGRDHWTVVKNILNILEEQK

A0A5D3BX45 Gag/pol protein | 1.6e-162 | 88.41 | Show/hide
Query:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLE
        MESMYSNSVWTLVDQ NDVKPIGCKWIYKRKRDQAGKVQTFKARLV KGYTQKEGI+Y E FS  AMIKSIRILLSI TFYDYEIWQMDVKT FLN +LE
Subjt:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLE

Query:  ESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQFQ
        ESIYMVQPE FIQKGQEQ +CKLQKSIYGLKQASRS NIRFDTAIKSYG EQNVDEPCVYKRI+NSTVAFLV+YVDDILLIGNDVGHL DIKKWLA QFQ
Subjt:  ESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQFQ

Query:  MKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSVG
        MKDLGNAQYVLG+QIVRNRKNKTLAMSQTSYIDKMLSRYKM NSKKGLLPY YGIHLSKEQCPKTPQEVEDMSNI YA A+GSLMY MLCT P+ICYSVG
Subjt:  MKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSVG

Query:  IVSRYQSNLGRDHWTVVKNILNILEEQK
        IVSR QS  GRDHWT VKNIL  L   K
Subjt:  IVSRYQSNLGRDHWTVVKNILNILEEQK

E2GK51 Gag/pol protein (Fragment) | 3.0e-161 | 84.64 | Show/hide
Query:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLE
        MESMY NSVWTLVD  +DVKPIGCKWIYKRKRDQAGKVQTFKARLV KGYTQKEG++Y ETFSPVAM+KSIRILLSI TFY+YEIWQMDVKTAFLN +LE
Subjt:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLE

Query:  ESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQFQ
        ESIYMVQPEGFI + QEQ VCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYK+I+NS VAFL++YVDDILLIGNDV +LTD+KKWL TQFQ
Subjt:  ESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQFQ

Query:  MKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSVG
        MKDLG AQY+LGIQIVRNRKNKTLAMSQ SYIDK+LSRYKMQNSKKG LP+ +GIHLSKEQCPKTPQEVEDM NI Y+ A+GSLMYAMLCT PDICYSVG
Subjt:  MKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSVG

Query:  IVSRYQSNLGRDHWTVVKNILNILEEQKTTCL
        IVSRYQSN GRDHWT VKNIL  L   +   L
Subjt:  IVSRYQSNLGRDHWTVVKNILNILEEQKTTCL

SwissProt top hits | e value | %identity | Alignment
P04146 Copia protein | 5.2e-54 | 36.81 | Show/hide
Query:  NSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLEESIYMV
        N+ WT+  +  +   +  +W++  K ++ G    +KARLV +G+TQK  I+Y ETF+PVA I S R +LS+V  Y+ ++ QMDVKTAFLN +L+E IYM 
Subjt:  NSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLEESIYMV

Query:  QPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVY---KRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQFQMKD
         P+G        NVCKL K+IYGLKQA+R W   F+ A+K   F  +  + C+Y   K  IN  + ++++YVDD+++   D+  + + K++L  +F+M D
Subjt:  QPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVY---KRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQFQMKD

Query:  LGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLP----YIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSV
        L   ++ +GI+I    +   + +SQ++Y+ K+LS++ M+N      P      Y +  S E C           N      IG LMY MLCT PD+  +V
Subjt:  LGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLP----YIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSV

Query:  GIVSRYQSNLGRDHWTVVKNILNILE
         I+SRY S    + W  +K +L  L+
Subjt:  GIVSRYQSNLGRDHWTVVKNILNILE

P10978 Retrovirus-related Pol polyprotein from transposon TNT 1-94 | 5.2e-86 | 47.01 | Show/hide
Query:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLE
        MES+  N  + LV+     +P+ CKW++K K+D   K+  +KARLVVKG+ QK+GI+++E FSPV  + SIR +LS+    D E+ Q+DVKTAFL+  LE
Subjt:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLE

Query:  ESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVY-KRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQF
        E IYM QPEGF   G++  VCKL KS+YGLKQA R W ++FD+ +KS  + +   +PCVY KR   +    L++YVDD+L++G D G +  +K  L+  F
Subjt:  ESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVY-KRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQF

Query:  QMKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSV
         MKDLG AQ +LG++IVR R ++ L +SQ  YI+++L R+ M+N+K    P    + LSK+ CP T +E  +M+ + Y+ A+GSLMYAM+CT PDI ++V
Subjt:  QMKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSV

Query:  GIVSRYQSNLGRDHWTVVKNILNILEEQKTTCLC
        G+VSR+  N G++HW  VK IL  L      CLC
Subjt:  GIVSRYQSNLGRDHWTVVKNILNILEEQKTTCLC

P25600 Putative transposon Ty5-1 protein YCL074W | 2.8e-23 | 29.8 | Show/hide
Query:  MDVKTAFLNRSLEESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGH
        MDV TAFLN +++E IY+ QP GF+ +     V +L   +YGLKQA   WN   +  +K  GF ++  E  +Y R  +    ++ +YVDD+L+       
Subjt:  MDVKTAFLNRSLEESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGH

Query:  LTDIKKWLATQFQMKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYA
           +K+ L   + MKDLG     LG+ I     N  + +S   YI K  S  ++   K    P    +  SK     T   ++D++   Y   +G L++ 
Subjt:  LTDIKKWLATQFQMKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYA

Query:  MLCTIPDICYSVGIVSRYQSNLGRDHWTVVKNILNILEEQKTTCL
             PDI Y V ++SR+       H    + +L  L   ++ CL
Subjt:  MLCTIPDICYSVGIVSRYQSNLGRDHWTVVKNILNILEEQKTTCL

Q94HW2 Retrovirus-related Pol polyprotein from transposon RE1 | 2.1e-47 | 35.38 | Show/hide
Query:  MESMYSNSVWTLV-DQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSL
        + +   N  W LV    + V  +GC+WI+ +K +  G +  +KARLV KGY Q+ G++Y ETFSPV    SIRI+L +     + I Q+DV  AFL  +L
Subjt:  MESMYSNSVWTLV-DQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSL

Query:  EESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQF
         + +YM QP GFI K +   VCKL+K++YGLKQA R+W +     + + GF  +V +  ++      ++ ++++YVDDIL+ GND   L +    L+ +F
Subjt:  EESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQF

Query:  QMKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSV
         +KD     Y LGI+    R    L +SQ  YI  +L+R  M  +K    P      LS     K     E      Y   +GSL Y +  T PDI Y+V
Subjt:  QMKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSV

Query:  GIVSRYQSNLGRDHWTVVKNILNIL
          +S++      +H   +K IL  L
Subjt:  GIVSRYQSNLGRDHWTVVKNILNIL

Q9ZT94 Retrovirus-related Pol polyprotein from transposon RE2 | 1.7e-49 | 34.77 | Show/hide
Query:  MESMYSNSVWTLV-DQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSL
        + +   N  W LV      V  +GC+WI+ +K +  G +  +KARLV KGY Q+ G++Y ETFSPV    SIRI+L +     + I Q+DV  AFL  +L
Subjt:  MESMYSNSVWTLV-DQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSL

Query:  EESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQF
         + +YM QP GF+ K +   VC+L+K+IYGLKQA R+W +   T + + GF  ++ +  ++      ++ ++++YVDDIL+ GND   L      L+ +F
Subjt:  EESIYMVQPEGFIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQF

Query:  QMKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSV
         +K+  +  Y LGI+    R  + L +SQ  Y   +L+R  M  +K    P      L+     K P   E      Y   +GSL Y +  T PD+ Y+V
Subjt:  QMKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSV

Query:  GIVSRYQSNLGRDHWTVVKNILNIL
          +S+Y      DHW  +K +L  L
Subjt:  GIVSRYQSNLGRDHWTVVKNILNIL

Arabidopsis top hits | e value | %identity | Alignment
AT4G23160.1 cysteine-rich RLK (RECEPTOR-like protein kinase) 8 | 4.4e-48 | 32.42 | Show/hide
Query:  SMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLEES
        +M +   W +     + KPIGCKW+YK K +  G ++ +KARLV KGYTQ+EGI++ ETFSPV  + S++++L+I   Y++ + Q+D+  AFLN  L+E 
Subjt:  SMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLEES

Query:  IYMVQPEGFIQKGQE----QNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQ
        IYM  P G+  +  +      VC L+KSIYGLKQASR W ++F   +  +GF Q+  +   + +I  +    +++YVDDI++  N+   + ++K  L + 
Subjt:  IYMVQPEGFIQKGQE----QNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQ

Query:  FQMKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYS
        F+++DLG  +Y LG++I R+     + + Q  Y   +L    +   K   +P    +  S           + +   +Y   IG LMY  +  + DI ++
Subjt:  FQMKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYS

Query:  VGIVSRYQSNLGRDHWTVVKNILNILE
        V  +S++       H   V  IL+ ++
Subjt:  VGIVSRYQSNLGRDHWTVVKNILNILE

ATMG00810.1 DNA/RNA polymerases superfamily protein | 1.1e-09 | 32.69 | Show/hide
Query:  FLVMYVDDILLIGNDVGHLTDIKKWLATQFQMKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEV
        +L++YVDDILL G+    L  +   L++ F MKDLG   Y LGIQI  +     L +SQT Y +++L+   M + K    P    ++ S     K P + 
Subjt:  FLVMYVDDILLIGNDVGHLTDIKKWLATQFQMKDLGNAQYVLGIQIVRNRKNKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEV

Query:  EDMSNISYAFAIGSLMYAMLCTIPDICYSVGIVSRYQSNLGRDHWTVVKNILNILE
         D  +I     +G+L Y  L T PDI Y+V IV +         + ++K +L  ++
Subjt:  EDMSNISYAFAIGSLMYAMLCTIPDICYSVGIVSRYQSNLGRDHWTVVKNILNILE

ATMG00820.1 Reverse transcriptase (RNA-dependent DNA polymerase) | 1.9e-11 | 38.96 | Show/hide
Query:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSI
        ++++  N  W LV    +   +GCKW++K K    G +   KARLV KG+ Q+EGI + ET+SPV    +IR +L++
Subjt:  MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSI


Sequences Show/hide sequences
CDS sequence Show/hide CDS sequence
ATGGAATCTATGTATTCCAATTCTGTCTGGACTCTAGTAGATCAACAAAATGATGTAAAACCTATTGGTTGTAAATGGATCTACAAGAGAAAACGAGATCAAGCTGGTAA
AGTACAGACTTTTAAAGCTCGACTAGTGGTAAAAGGTTATACACAAAAGGAGGGAATAAATTATAATGAAACTTTCTCTCCTGTTGCCATGATAAAGTCGATTAGAATAC
TCTTATCCATCGTCACTTTTTATGATTATGAAATTTGGCAGATGGATGTCAAGACAGCCTTTTTGAATAGAAGTCTTGAAGAGAGTATCTATATGGTCCAACCAGAGGGG
TTCATACAAAAGGGTCAAGAACAAAATGTTTGTAAGCTTCAAAAATCTATTTATGGATTGAAACAAGCATCTAGATCCTGGAATATAAGATTTGATACTGCGATCAAATC
TTATGGTTTTGAACAGAATGTTGATGAACCCTGTGTTTACAAAAGGATCATCAATTCTACTGTAGCATTCTTAGTTATGTATGTAGATGATATTCTACTCATTGGGAATG
ATGTAGGTCATCTAACTGATATTAAGAAATGGCTAGCTACGCAATTCCAAATGAAAGATTTGGGAAATGCACAATATGTTCTTGGCATCCAAATAGTTCGGAACCGAAAG
AACAAAACTCTAGCCATGTCTCAAACATCTTATATAGACAAAATGTTGTCAAGATATAAGATGCAGAATTCCAAAAAAGGTCTGTTGCCGTACATATATGGAATTCATTT
ATCAAAAGAACAATGTCCAAAGACACCTCAAGAAGTTGAGGATATGAGTAACATTTCCTATGCTTTTGCTATTGGGAGCCTGATGTATGCAATGTTATGTACTATACCTG
ACATTTGCTATTCCGTGGGAATAGTTAGTAGATATCAGTCCAATCTTGGACGTGATCATTGGACAGTCGTTAAGAATATTCTAAATATCTTAGAAGAACAAAAGACTACA
TGCTTGTGTATGGTTCTAAGGTTCTGA
mRNA sequence Show/hide mRNA sequence
ATGGAATCTATGTATTCCAATTCTGTCTGGACTCTAGTAGATCAACAAAATGATGTAAAACCTATTGGTTGTAAATGGATCTACAAGAGAAAACGAGATCAAGCTGGTAA
AGTACAGACTTTTAAAGCTCGACTAGTGGTAAAAGGTTATACACAAAAGGAGGGAATAAATTATAATGAAACTTTCTCTCCTGTTGCCATGATAAAGTCGATTAGAATAC
TCTTATCCATCGTCACTTTTTATGATTATGAAATTTGGCAGATGGATGTCAAGACAGCCTTTTTGAATAGAAGTCTTGAAGAGAGTATCTATATGGTCCAACCAGAGGGG
TTCATACAAAAGGGTCAAGAACAAAATGTTTGTAAGCTTCAAAAATCTATTTATGGATTGAAACAAGCATCTAGATCCTGGAATATAAGATTTGATACTGCGATCAAATC
TTATGGTTTTGAACAGAATGTTGATGAACCCTGTGTTTACAAAAGGATCATCAATTCTACTGTAGCATTCTTAGTTATGTATGTAGATGATATTCTACTCATTGGGAATG
ATGTAGGTCATCTAACTGATATTAAGAAATGGCTAGCTACGCAATTCCAAATGAAAGATTTGGGAAATGCACAATATGTTCTTGGCATCCAAATAGTTCGGAACCGAAAG
AACAAAACTCTAGCCATGTCTCAAACATCTTATATAGACAAAATGTTGTCAAGATATAAGATGCAGAATTCCAAAAAAGGTCTGTTGCCGTACATATATGGAATTCATTT
ATCAAAAGAACAATGTCCAAAGACACCTCAAGAAGTTGAGGATATGAGTAACATTTCCTATGCTTTTGCTATTGGGAGCCTGATGTATGCAATGTTATGTACTATACCTG
ACATTTGCTATTCCGTGGGAATAGTTAGTAGATATCAGTCCAATCTTGGACGTGATCATTGGACAGTCGTTAAGAATATTCTAAATATCTTAGAAGAACAAAAGACTACA
TGCTTGTGTATGGTTCTAAGGTTCTGA
Protein sequence Show/hide protein sequence
MESMYSNSVWTLVDQQNDVKPIGCKWIYKRKRDQAGKVQTFKARLVVKGYTQKEGINYNETFSPVAMIKSIRILLSIVTFYDYEIWQMDVKTAFLNRSLEESIYMVQPEG
FIQKGQEQNVCKLQKSIYGLKQASRSWNIRFDTAIKSYGFEQNVDEPCVYKRIINSTVAFLVMYVDDILLIGNDVGHLTDIKKWLATQFQMKDLGNAQYVLGIQIVRNRK
NKTLAMSQTSYIDKMLSRYKMQNSKKGLLPYIYGIHLSKEQCPKTPQEVEDMSNISYAFAIGSLMYAMLCTIPDICYSVGIVSRYQSNLGRDHWTVVKNILNILEEQKTT
CLCMVLRF