(data stored in ACNUC13479 zone)

EMBL: CP002688.PE74

CP002688.PE74        Location/Qualifiers
FT   CDS             complement(join(162803..163505,163615..163718,
FT                   163809..163892,163996..164040,164121..164192,
FT                   164295..164375,164517..164612,164685..164759,
FT                   164845..164892,164996..165079,165167..165274,
FT                   165352..165385,165470..165669,165790..165888,
FT                   165970..166017,166265..166507,166582..166698,
FT                   166988..167056,167391..167936,168051..168605,
FT                   168711..168830,169035..169206,169645..169813,
FT                   169924..169999,170082..170174,170284..170443,
FT                   170870..171072))
FT                   /codon_start=1
FT                   /gene="ESP4"
FT                   /gene_synonym="ENHANCED SILENCING PHENOTYPE 4"
FT                   /gene_synonym="T10O8.110"
FT                   /gene_synonym="T10O8_110"
FT                   /locus_tag="AT5G01400"
FT                   /product="HEAT repeat-containing protein"
FT                   /note="ENHANCED SILENCING PHENOTYPE 4 (ESP4); FUNCTIONS IN:
FT                   binding; INVOLVED IN: posttranscriptional gene silencing by
FT                   RNA, RNA processing; LOCATED IN: mRNA cleavage and
FT                   polyadenylation specificity factor complex; EXPRESSED IN:
FT                   23 plant structures; EXPRESSED DURING: 13 growth stages;
FT                   CONTAINS InterPro DOMAIN/s: Symplekin tight junction
FT                   protein C-terminal (InterPro:IPR022075), Armadillo-type
FT                   fold (InterPro:IPR016024), Protein of unknown function
FT                   DUF3453 (InterPro:IPR021850); BEST Arabidopsis thaliana
FT                   protein match is: unknown protein (TAIR:AT1G27595.1); Has
FT                   1807 Blast hits to 1807 proteins in 277 species: Archae -
FT                   0; Bacteria - 0; Metazoa - 736; Fungi - 347; Plants - 385;
FT                   Viruses - 0; Other Eukaryotes - 339 (source: NCBI BLink)."
FT                   /db_xref="GOA:Q9M033"
FT                   /db_xref="InterPro:IPR011989"
FT                   /db_xref="InterPro:IPR016024"
FT                   /db_xref="InterPro:IPR022075"
FT                   /db_xref="InterPro:IPR032460"
FT                   /db_xref="UniProtKB/TrEMBL:Q9M033"
FT                   /inference="similar to RNA sequence,
FT                   EST:INSD:ES071419.1,INSD:ES072101.1,INSD:EH859230.1,
FT                   INSD:EH825985.1,INSD:AV545988.1,INSD:AV529152.1,
FT                   INSD:AV546483.1,INSD:DR383177.1,INSD:DR275772.1,
FT                   INSD:DR275773.1,INSD:T45463.1,INSD:AA394514.1,
FT                   INSD:ES017155.1,INSD:AV539512.1"
FT                   /protein_id="AED90339.1"
FT                   /translation="MASYSRARLKDLANSAKSATELPPKLQRLRYMRRDLQKDDSVFPT
FT                   ELLPHLFDLLSDQFGAVRKFVAEILGEIGLKYVELIPEIVPLLIKSLEDETPAVARQVI
FT                   ACGADLFRSTLERVAVQGLHSSELNDLLESSWTWLIKFKDEICSVAFKQGNSGVKLCAM
FT                   KFVEALILLYTPHEGIEADFNISILRGGHPVLKIGDLSIEASQKLGLLLDQLRHPAAKS
FT                   LNSSTIIVLINSLSSVAKKRPAYCGRILPVLLSLDPLSFLKGVYAAATNLALKTVFLSC
FT                   LKCTHPAAAPDRLTSALKEIEGGGQAAKAKDLFYKTNGSIQDKDSVEDTKVSVEENPLC
FT                   ASSDVAESNLSRKRSGSEYNIDLNGDASDGKRARITPSVSEESTDGLNGNDGVSLPRVA
FT                   STSTGPSDSRGVSDSGPAQQLVGLFGTLVSQGEKAIGSLEILISSISADLLTDVVMANM
FT                   HNIPPNCSSYADGTDELVMNMCIVGSDAQIKYPPSFVAGVLSLSTAFPPIAALINPHNE
FT                   DEEVYSVHVDQQMFPAEDARTPPGLLATCDTSFPENEESNTVSPQNVHYIGNRESGIPG
FT                   LESSAQHDGSGALVTNVLSSTNVEAASKNQNASFSGKLLVDVIPSMSVDKLEEFSPKAV
FT                   GTVASASQFVLPKISAPVVDLSDEEKDSLQKLVFLRIVEAYKQISMSGGSQLRFSLLAH
FT                   LGVEFPSELDPWKILQEHVLSDYLNHEGHELTVRVLYRLYGEAEAEQDFFSSTTAASAY
FT                   ESFLLTVAEALRDSFPPSDKSLSKLLGDSPHLPKSVLMLLESFCCPGSGEVEKDLQHGD
FT                   RVTQGLSAVWSLILMRPGIRNDCLNIALQSAVHHLEEIRMKAIRLVANKLYSLSFITEQ
FT                   IEEFAKDRLFSVVSDDCDKMDLDLKSPPNKPQHSISGMSMETPSEATSSSTSVTEAQRC
FT                   LSLYFALCTKVLRIFTILRLMTNLVFNIYKNASDPVKQAIHLQIPILVRTMGSSSELLK
FT                   IIADPPSGSDNLLIQVLQTLTEGPTPSSELILTIRKLFDTRIKDVEILFPILPFLPRDD
FT                   VLRIFPHMVNLPMEKFQVALSRVLQGSSQSGPVLSPSEALIAIHSIDPARDGIPLKQVT
FT                   DACNTCFAQRQTFTQQVLAGVLNQLVQQIPLPMLFMRTVLQAIGAFPALSDFILEILSR
FT                   LVSKQIWKYPKLWVGFLKCTQTTQPQSYKVLLQLPPLQLGNALTKIPALRAPLTAHASQ
FT                   PEIQSSLPRSTLAVLGLVPDSQGTQTSQVQANETQTSQEQQQQQASEPQQTSQSQQVSV
FT                   PLSHSQVDHQEPSQVVASQSQSSPIGTVQSAMSQSQNSPIDTGRSEMSQSQNSPIDTGR
FT                   SEMSQSQNSPIDTGRSEMSQSQNSPIDTGRSEMSESQSSPIGQSQSSPIGTGQSDMSQT
FT                   PQVSDSSAPEPTSHTRTSDPQASSQTLRDDDEKIDDTATSENEVTEIEKSKESSEEEEE
FT                   EEEEEE"
     MASYSRARLK DLANSAKSAT ELPPKLQRLR YMRRDLQKDD SVFPTELLPH LFDLLSDQFG        60
     AVRKFVAEIL GEIGLKYVEL IPEIVPLLIK SLEDETPAVA RQVIACGADL FRSTLERVAV       120
     QGLHSSELND LLESSWTWLI KFKDEICSVA FKQGNSGVKL CAMKFVEALI LLYTPHEGIE       180
     ADFNISILRG GHPVLKIGDL SIEASQKLGL LLDQLRHPAA KSLNSSTIIV LINSLSSVAK       240
     KRPAYCGRIL PVLLSLDPLS FLKGVYAAAT NLALKTVFLS CLKCTHPAAA PDRLTSALKE       300
     IEGGGQAAKA KDLFYKTNGS IQDKDSVEDT KVSVEENPLC ASSDVAESNL SRKRSGSEYN       360
     IDLNGDASDG KRARITPSVS EESTDGLNGN DGVSLPRVAS TSTGPSDSRG VSDSGPAQQL       420
     VGLFGTLVSQ GEKAIGSLEI LISSISADLL TDVVMANMHN IPPNCSSYAD GTDELVMNMC       480
     IVGSDAQIKY PPSFVAGVLS LSTAFPPIAA LINPHNEDEE VYSVHVDQQM FPAEDARTPP       540
     GLLATCDTSF PENEESNTVS PQNVHYIGNR ESGIPGLESS AQHDGSGALV TNVLSSTNVE       600
     AASKNQNASF SGKLLVDVIP SMSVDKLEEF SPKAVGTVAS ASQFVLPKIS APVVDLSDEE       660
     KDSLQKLVFL RIVEAYKQIS MSGGSQLRFS LLAHLGVEFP SELDPWKILQ EHVLSDYLNH       720
     EGHELTVRVL YRLYGEAEAE QDFFSSTTAA SAYESFLLTV AEALRDSFPP SDKSLSKLLG       780
     DSPHLPKSVL MLLESFCCPG SGEVEKDLQH GDRVTQGLSA VWSLILMRPG IRNDCLNIAL       840
     QSAVHHLEEI RMKAIRLVAN KLYSLSFITE QIEEFAKDRL FSVVSDDCDK MDLDLKSPPN       900
     KPQHSISGMS METPSEATSS STSVTEAQRC LSLYFALCTK VLRIFTILRL MTNLVFNIYK       960
     NASDPVKQAI HLQIPILVRT MGSSSELLKI IADPPSGSDN LLIQVLQTLT EGPTPSSELI      1020
     LTIRKLFDTR IKDVEILFPI LPFLPRDDVL RIFPHMVNLP MEKFQVALSR VLQGSSQSGP      1080
     VLSPSEALIA IHSIDPARDG IPLKQVTDAC NTCFAQRQTF TQQVLAGVLN QLVQQIPLPM      1140
     LFMRTVLQAI GAFPALSDFI LEILSRLVSK QIWKYPKLWV GFLKCTQTTQ PQSYKVLLQL      1200
     PPLQLGNALT KIPALRAPLT AHASQPEIQS SLPRSTLAVL GLVPDSQGTQ TSQVQANETQ      1260
     TSQEQQQQQA SEPQQTSQSQ QVSVPLSHSQ VDHQEPSQVV ASQSQSSPIG TVQSAMSQSQ      1320
     NSPIDTGRSE MSQSQNSPID TGRSEMSQSQ NSPIDTGRSE MSQSQNSPID TGRSEMSESQ      1380
     SSPIGQSQSS PIGTGQSDMS QTPQVSDSSA PEPTSHTRTS DPQASSQTLR DDDEKIDDTA      1440
     TSENEVTEIE KSKESSEEEE EEEEEEE                                          1467
//

If you have problems or comments...

PBIL Back to PBIL home page