ID   A0A3Q2I5Q7_HORSE        Unreviewed;      1192 AA.
AC   A0A3Q2I5Q7;
DT   10-APR-2019, integrated into UniProtKB/TrEMBL.
DT   10-APR-2019, sequence version 1.
DT   02-JUN-2021, entry version 13.
DE   RecName: Full=Receptor protein-tyrosine kinase {ECO:0000256|ARBA:ARBA00011902};
DE            EC=2.7.10.1 {ECO:0000256|ARBA:ARBA00011902};
GN   Name=EGFR {ECO:0000313|Ensembl:ENSECAP00000043331,
GN   ECO:0000313|VGNC:VGNC:17460};
OS   Equus caballus (Horse).
OC   Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi; Mammalia;
OC   Eutheria; Laurasiatheria; Perissodactyla; Equidae; Equus.
OX   NCBI_TaxID=9796 {ECO:0000313|Ensembl:ENSECAP00000043331, ECO:0000313|Proteomes:UP000002281};
RN   [1] {ECO:0000313|Ensembl:ENSECAP00000043331, ECO:0000313|Proteomes:UP000002281}
RP   NUCLEOTIDE SEQUENCE [LARGE SCALE GENOMIC DNA].
RC   STRAIN=Thoroughbred {ECO:0000313|Ensembl:ENSECAP00000043331,
RC   ECO:0000313|Proteomes:UP000002281};
RX   PubMed=19892987; DOI=10.1126/science.1178158;
RG   Broad Institute Genome Sequencing Platform;
RG   Broad Institute Whole Genome Assembly Team;
RA   Wade C.M., Giulotto E., Sigurdsson S., Zoli M., Gnerre S., Imsland F.,
RA   Lear T.L., Adelson D.L., Bailey E., Bellone R.R., Bloecker H., Distl O.,
RA   Edgar R.C., Garber M., Leeb T., Mauceli E., MacLeod J.N., Penedo M.C.T.,
RA   Raison J.M., Sharpe T., Vogel J., Andersson L., Antczak D.F., Biagi T.,
RA   Binns M.M., Chowdhary B.P., Coleman S.J., Della Valle G., Fryc S.,
RA   Guerin G., Hasegawa T., Hill E.W., Jurka J., Kiialainen A., Lindgren G.,
RA   Liu J., Magnani E., Mickelson J.R., Murray J., Nergadze S.G., Onofrio R.,
RA   Pedroni S., Piras M.F., Raudsepp T., Rocchi M., Roeed K.H., Ryder O.A.,
RA   Searle S., Skow L., Swinburne J.E., Syvaenen A.C., Tozaki T., Valberg S.J.,
RA   Vaudin M., White J.R., Zody M.C., Lander E.S., Lindblad-Toh K.;
RT   "Genome sequence, comparative analysis, and population genetics of the
RT   domestic horse.";
RL   Science 326:865-867(2009).
RN   [2] {ECO:0000313|Ensembl:ENSECAP00000043331}
RP   IDENTIFICATION.
RC   STRAIN=Thoroughbred {ECO:0000313|Ensembl:ENSECAP00000043331};
RG   Ensembl;
RL   Submitted (JAN-2019) to UniProtKB.
CC   -!- CATALYTIC ACTIVITY:
CC       Reaction=ATP + L-tyrosyl-[protein] = ADP + H(+) + O-phospho-L-tyrosyl-
CC         [protein]; Xref=Rhea:RHEA:10596, Rhea:RHEA-COMP:10136, Rhea:RHEA-
CC         COMP:10137, ChEBI:CHEBI:15378, ChEBI:CHEBI:30616, ChEBI:CHEBI:46858,
CC         ChEBI:CHEBI:82620, ChEBI:CHEBI:456216; EC=2.7.10.1;
CC         Evidence={ECO:0000256|ARBA:ARBA00001171};
CC   -!- SUBCELLULAR LOCATION: Membrane {ECO:0000256|ARBA:ARBA00004479}; Single-
CC       pass type I membrane protein {ECO:0000256|ARBA:ARBA00004479}.
CC   ---------------------------------------------------------------------------
CC   Copyrighted by the UniProt Consortium, see https://www.uniprot.org/terms
CC   Distributed under the Creative Commons Attribution (CC BY 4.0) License
CC   ---------------------------------------------------------------------------
DR   Ensembl; ENSECAT00000042132; ENSECAP00000043331; ENSECAG00000009952.
DR   VGNC; VGNC:17460; EGFR.
DR   GeneTree; ENSGT00940000155450; -.
DR   OMA; PECKGCT; -.
DR   Proteomes; UP000002281; Chromosome 4.
DR   ExpressionAtlas; A0A3Q2I5Q7; baseline.
DR   GO; GO:0016021; C:integral component of membrane; IEA:UniProtKB-KW.
DR   GO; GO:0005524; F:ATP binding; IEA:UniProtKB-UniRule.
DR   GO; GO:0004714; F:transmembrane receptor protein tyrosine kinase activity; IEA:UniProtKB-EC.
DR   GO; GO:0007169; P:transmembrane receptor protein tyrosine kinase signaling pathway; IEA:InterPro.
DR   CDD; cd00064; FU; 3.
DR   Gene3D; 3.80.20.20; -; 2.
DR   InterPro; IPR006211; Furin-like_Cys-rich_dom.
DR   InterPro; IPR006212; Furin_repeat.
DR   InterPro; IPR032778; GF_recep_IV.
DR   InterPro; IPR009030; Growth_fac_rcpt_cys_sf.
DR   InterPro; IPR011009; Kinase-like_dom_sf.
DR   InterPro; IPR000719; Prot_kinase_dom.
DR   InterPro; IPR017441; Protein_kinase_ATP_BS.
DR   InterPro; IPR000494; Rcpt_L-dom.
DR   InterPro; IPR036941; Rcpt_L-dom_sf.
DR   InterPro; IPR001245; Ser-Thr/Tyr_kinase_cat_dom.
DR   InterPro; IPR008266; Tyr_kinase_AS.
DR   InterPro; IPR020635; Tyr_kinase_cat_dom.
DR   InterPro; IPR016245; Tyr_kinase_EGF/ERB/XmrK_rcpt.
DR   Pfam; PF00757; Furin-like; 1.
DR   Pfam; PF14843; GF_recep_IV; 1.
DR   Pfam; PF07714; PK_Tyr_Ser-Thr; 1.
DR   Pfam; PF01030; Recep_L_domain; 2.
DR   PIRSF; PIRSF000619; TyrPK_EGF-R; 2.
DR   PRINTS; PR00109; TYRKINASE.
DR   SMART; SM00261; FU; 4.
DR   SMART; SM00219; TyrKc; 1.
DR   SUPFAM; SSF56112; SSF56112; 1.
DR   SUPFAM; SSF57184; SSF57184; 2.
DR   PROSITE; PS00107; PROTEIN_KINASE_ATP; 1.
DR   PROSITE; PS50011; PROTEIN_KINASE_DOM; 1.
DR   PROSITE; PS00109; PROTEIN_KINASE_TYR; 1.
PE   4: Predicted;
KW   ATP-binding {ECO:0000256|ARBA:ARBA00022840, ECO:0000256|PIRSR:PIRSR000619-
KW   2}; Kinase {ECO:0000256|ARBA:ARBA00022777};
KW   Membrane {ECO:0000256|ARBA:ARBA00023136, ECO:0000256|SAM:Phobius};
KW   Nucleotide-binding {ECO:0000256|ARBA:ARBA00022741, ECO:0000256|PROSITE-
KW   ProRule:PRU10141}; Phosphoprotein {ECO:0000256|ARBA:ARBA00022553};
KW   Receptor {ECO:0000256|ARBA:ARBA00023170};
KW   Reference proteome {ECO:0000313|Proteomes:UP000002281};
KW   Signal {ECO:0000256|SAM:SignalP};
KW   Transferase {ECO:0000256|ARBA:ARBA00022679};
KW   Transmembrane {ECO:0000256|ARBA:ARBA00022692, ECO:0000256|SAM:Phobius};
KW   Transmembrane helix {ECO:0000256|ARBA:ARBA00022989,
KW   ECO:0000256|SAM:Phobius};
KW   Tyrosine-protein kinase {ECO:0000256|ARBA:ARBA00023137}.
FT   SIGNAL          1..24
FT                   /evidence="ECO:0000256|SAM:SignalP"
FT   CHAIN           25..1192
FT                   /note="Receptor protein-tyrosine kinase"
FT                   /evidence="ECO:0000256|SAM:SignalP"
FT                   /id="PRO_5018752115"
FT   TRANSMEM        646..668
FT                   /note="Helical"
FT                   /evidence="ECO:0000256|SAM:Phobius"
FT   DOMAIN          712..979
FT                   /note="Protein kinase"
FT                   /evidence="ECO:0000259|PROSITE:PS50011"
FT   NP_BIND         718..726
FT                   /note="ATP"
FT                   /evidence="ECO:0000256|PIRSR:PIRSR000619-2"
FT   REGION          1078..1122
FT                   /note="Disordered"
FT                   /evidence="ECO:0000256|SAM:MobiDB-lite"
FT   COMPBIAS        1081..1095
FT                   /note="Polar residues"
FT                   /evidence="ECO:0000256|SAM:MobiDB-lite"
FT   ACT_SITE        837
FT                   /note="Proton acceptor"
FT                   /evidence="ECO:0000256|PIRSR:PIRSR000619-1"
FT   BINDING         745
FT                   /note="ATP"
FT                   /evidence="ECO:0000256|PIRSR:PIRSR000619-2,
FT                   ECO:0000256|PROSITE-ProRule:PRU10141"
SQ   SEQUENCE   1192 AA;  132850 MW;  A131BB33E5064309 CRC64;
     MRHSGTVGAA LLVLLAAYFQ ASPALEEKKV CQGTSNRLTQ LGTFEDHFLS LQRMFNNCEV
     VLGNLEITYM QKNYDLSFLK TIQEVAGYVL IALNTVEKIP LENLQIIRGN VLYENTHALS
     VLSNYGANKV GLRELPMRNL QEILQGAVRF SNNPILCNME TIQWRDIVNS DFLSNMSVDF
     QNQLGSCQKC DPACPNGSCW GVGKENCQKL TKTICAQQCS GRCRGRSPSD CCHNQCAAGC
     TGPRESDCLV CRKFRDEATC KDTCPPLMLY NPTTYQMDVN PDGKYSFGAT CVKKCPRNYV
     VTDHGSCVRA CSSDSYEVEE DGVRKCKKCE GPCRKVCNGI GIGEFKDTLS INATNIKHFK
     NCTSISGDLH ILPVAFRGDS FTRTPPLDPK ELDILQTVKE ITGFLLIQAW PENRTDLHAF
     ENLEIIRGRT KQHGQFSLAV VGLDITSLGL RSLKEISDGD VIISGNRNLC YANTIKWKKL
     FGTSSQKTKI INNRSEKDCK TVGHVCNLLC SSEGCWGPEP RDCVSCQNVS RGKECVEKCN
     ILEGEPREFV ENSECIQCHP ECLPQAMNIT CTGRGPDNCI KCAHYIDGPH CVKTCPSGIM
     GENNTLVWKF ADANHVCHLC HPNCTYGCAG PGLEGCARNG PKIPSIATGI VGGLLLVVVV
     ALGIGLFLRR RHIVRKRTLR RLLQERELVE PLTPSGEAPN QALLRILKET EFKKIKVLGS
     GAFGTVYKGL WIPEGEKVKI PVAIKELREA TSPKANKEIL DEAYVMASVD NPHVCRLLGI
     CLTSTVQLIT QLMPFGCLLD YVREHKDNIG SQYLLNWCVQ IAKGMNYLED RRLVHRDLAA
     RNVLVKTPQH VKITDFGLAK LLGAEEKEYH AEGGKVPIKW MALESILHRI YTHQSDVWSY
     GVTVWELMTF GSKPYDGIPA SEISTILEKG ERLPQPPICT IDVYMIMVKC WMIDADSRPK
     FRELIIEFSK MARDPQRYLV IQGDERMHLP SPTDSNFYRT LMDEEDMEDV VDADEYLIPQ
     QGFFHSPSTS RTPLISSLSC PLKEDSFLQR YSSDPTGTVT EDNIDDTFLP APEYVNQSVP
     KRPAGSVQNP VYHNQPLNPA PGRDPHYQNP HSNAMDNPEY LNTTHPDCVN SVLDGTALWA
     QKGNHQISLD NPDYQQDFFP KEAKSNGIFK GPAAENAEYL RVAPPSSEFI GA
//