ID   A0A3Q2I5Q7_HORSE        Unreviewed;      1192 AA.
AC   A0A3Q2I5Q7;
DT   10-APR-2019, integrated into UniProtKB/TrEMBL.
DT   10-APR-2019, sequence version 1.
DT   12-OCT-2022, entry version 18.
DE   RecName: Full=Receptor protein-tyrosine kinase {ECO:0000256|ARBA:ARBA00011902, ECO:0000256|PIRNR:PIRNR000619};
DE            EC=2.7.10.1 {ECO:0000256|ARBA:ARBA00011902, ECO:0000256|PIRNR:PIRNR000619};
GN   Name=EGFR {ECO:0000313|Ensembl:ENSECAP00000043331,
GN   ECO:0000313|VGNC:VGNC:17460};
OS   Equus caballus (Horse).
OC   Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi; Mammalia;
OC   Eutheria; Laurasiatheria; Perissodactyla; Equidae; Equus.
OX   NCBI_TaxID=9796 {ECO:0000313|Ensembl:ENSECAP00000043331, ECO:0000313|Proteomes:UP000002281};
RN   [1] {ECO:0000313|Ensembl:ENSECAP00000043331, ECO:0000313|Proteomes:UP000002281}
RP   NUCLEOTIDE SEQUENCE [LARGE SCALE GENOMIC DNA].
RC   STRAIN=Thoroughbred {ECO:0000313|Ensembl:ENSECAP00000043331,
RC   ECO:0000313|Proteomes:UP000002281};
RX   PubMed=19892987; DOI=10.1126/science.1178158;
RG   Broad Institute Genome Sequencing Platform;
RG   Broad Institute Whole Genome Assembly Team;
RA   Wade C.M., Giulotto E., Sigurdsson S., Zoli M., Gnerre S., Imsland F.,
RA   Lear T.L., Adelson D.L., Bailey E., Bellone R.R., Bloecker H., Distl O.,
RA   Edgar R.C., Garber M., Leeb T., Mauceli E., MacLeod J.N., Penedo M.C.T.,
RA   Raison J.M., Sharpe T., Vogel J., Andersson L., Antczak D.F., Biagi T.,
RA   Binns M.M., Chowdhary B.P., Coleman S.J., Della Valle G., Fryc S.,
RA   Guerin G., Hasegawa T., Hill E.W., Jurka J., Kiialainen A., Lindgren G.,
RA   Liu J., Magnani E., Mickelson J.R., Murray J., Nergadze S.G., Onofrio R.,
RA   Pedroni S., Piras M.F., Raudsepp T., Rocchi M., Roeed K.H., Ryder O.A.,
RA   Searle S., Skow L., Swinburne J.E., Syvaenen A.C., Tozaki T., Valberg S.J.,
RA   Vaudin M., White J.R., Zody M.C., Lander E.S., Lindblad-Toh K.;
RT   "Genome sequence, comparative analysis, and population genetics of the
RT   domestic horse.";
RL   Science 326:865-867(2009).
RN   [2] {ECO:0000313|Ensembl:ENSECAP00000043331}
RP   IDENTIFICATION.
RC   STRAIN=Thoroughbred {ECO:0000313|Ensembl:ENSECAP00000043331};
RG   Ensembl;
RL   Submitted (JAN-2019) to UniProtKB.
CC   -!- CATALYTIC ACTIVITY:
CC       Reaction=ATP + L-tyrosyl-[protein] = ADP + H(+) + O-phospho-L-tyrosyl-
CC         [protein]; Xref=Rhea:RHEA:10596, Rhea:RHEA-COMP:10136, Rhea:RHEA-
CC         COMP:10137, ChEBI:CHEBI:15378, ChEBI:CHEBI:30616, ChEBI:CHEBI:46858,
CC         ChEBI:CHEBI:82620, ChEBI:CHEBI:456216; EC=2.7.10.1;
CC         Evidence={ECO:0000256|ARBA:ARBA00001171};
CC   -!- SUBCELLULAR LOCATION: Membrane {ECO:0000256|ARBA:ARBA00004479}; Single-
CC       pass type I membrane protein {ECO:0000256|ARBA:ARBA00004479}.
CC   -!- SIMILARITY: Belongs to the protein kinase superfamily. Tyr protein
CC       kinase family. EGF receptor subfamily. {ECO:0000256|PIRNR:PIRNR000619}.
CC   ---------------------------------------------------------------------------
CC   Copyrighted by the UniProt Consortium, see https://www.uniprot.org/terms
CC   Distributed under the Creative Commons Attribution (CC BY 4.0) License
CC   ---------------------------------------------------------------------------
DR   Ensembl; ENSECAT00000042132.1; ENSECAP00000043331.1; ENSECAG00000009952.3.
DR   VGNC; VGNC:17460; EGFR.
DR   GeneTree; ENSGT00940000155450; -.
DR   Proteomes; UP000002281; Chromosome 4.
DR   Bgee; ENSECAG00000009952; Expressed in trophoblast and 20 other tissues.
DR   ExpressionAtlas; A0A3Q2I5Q7; baseline.
DR   GO; GO:0016021; C:integral component of membrane; IEA:UniProtKB-KW.
DR   GO; GO:0098590; C:plasma membrane region; IEA:UniProt.
DR   GO; GO:0005524; F:ATP binding; IEA:UniProtKB-UniRule.
DR   GO; GO:0004714; F:transmembrane receptor protein tyrosine kinase activity; IEA:UniProtKB-EC.
DR   GO; GO:0042127; P:regulation of cell population proliferation; IEA:UniProt.
DR   GO; GO:0007169; P:transmembrane receptor protein tyrosine kinase signaling pathway; IEA:InterPro.
DR   CDD; cd00064; FU; 3.
DR   Gene3D; 3.80.20.20; -; 2.
DR   Gene3D; 6.10.250.2930; -; 1.
DR   InterPro; IPR044912; Egfr_JX_dom.
DR   InterPro; IPR006211; Furin-like_Cys-rich_dom.
DR   InterPro; IPR006212; Furin_repeat.
DR   InterPro; IPR032778; GF_recep_IV.
DR   InterPro; IPR009030; Growth_fac_rcpt_cys_sf.
DR   InterPro; IPR011009; Kinase-like_dom_sf.
DR   InterPro; IPR000719; Prot_kinase_dom.
DR   InterPro; IPR017441; Protein_kinase_ATP_BS.
DR   InterPro; IPR000494; Rcpt_L-dom.
DR   InterPro; IPR036941; Rcpt_L-dom_sf.
DR   InterPro; IPR001245; Ser-Thr/Tyr_kinase_cat_dom.
DR   InterPro; IPR008266; Tyr_kinase_AS.
DR   InterPro; IPR020635; Tyr_kinase_cat_dom.
DR   InterPro; IPR016245; Tyr_kinase_EGF/ERB/XmrK_rcpt.
DR   Pfam; PF00757; Furin-like; 1.
DR   Pfam; PF14843; GF_recep_IV; 1.
DR   Pfam; PF07714; PK_Tyr_Ser-Thr; 1.
DR   Pfam; PF01030; Recep_L_domain; 2.
DR   PIRSF; PIRSF000619; TyrPK_EGF-R; 2.
DR   PRINTS; PR00109; TYRKINASE.
DR   SMART; SM00261; FU; 4.
DR   SMART; SM00219; TyrKc; 1.
DR   SUPFAM; SSF56112; SSF56112; 1.
DR   SUPFAM; SSF57184; SSF57184; 2.
DR   PROSITE; PS00107; PROTEIN_KINASE_ATP; 1.
DR   PROSITE; PS50011; PROTEIN_KINASE_DOM; 1.
DR   PROSITE; PS00109; PROTEIN_KINASE_TYR; 1.
PE   3: Inferred from homology;
KW   ATP-binding {ECO:0000256|ARBA:ARBA00022840, ECO:0000256|PIRNR:PIRNR000619};
KW   Kinase {ECO:0000256|ARBA:ARBA00022777, ECO:0000256|PIRNR:PIRNR000619};
KW   Membrane {ECO:0000256|ARBA:ARBA00023136, ECO:0000256|PIRNR:PIRNR000619};
KW   Nucleotide-binding {ECO:0000256|ARBA:ARBA00022741,
KW   ECO:0000256|PIRNR:PIRNR000619};
KW   Phosphoprotein {ECO:0000256|ARBA:ARBA00022553};
KW   Receptor {ECO:0000256|ARBA:ARBA00023170, ECO:0000256|PIRNR:PIRNR000619};
KW   Reference proteome {ECO:0000313|Proteomes:UP000002281};
KW   Signal {ECO:0000256|SAM:SignalP};
KW   Transferase {ECO:0000256|ARBA:ARBA00022679, ECO:0000256|PIRNR:PIRNR000619};
KW   Transmembrane {ECO:0000256|ARBA:ARBA00022692, ECO:0000256|SAM:Phobius};
KW   Transmembrane helix {ECO:0000256|ARBA:ARBA00022989,
KW   ECO:0000256|SAM:Phobius};
KW   Tyrosine-protein kinase {ECO:0000256|ARBA:ARBA00023137,
KW   ECO:0000256|PIRNR:PIRNR000619}.
FT   SIGNAL          1..24
FT                   /evidence="ECO:0000256|SAM:SignalP"
FT   CHAIN           25..1192
FT                   /note="Receptor protein-tyrosine kinase"
FT                   /evidence="ECO:0000256|SAM:SignalP"
FT                   /id="PRO_5018752115"
FT   TRANSMEM        646..668
FT                   /note="Helical"
FT                   /evidence="ECO:0000256|SAM:Phobius"
FT   DOMAIN          712..979
FT                   /note="Protein kinase"
FT                   /evidence="ECO:0000259|PROSITE:PS50011"
FT   REGION          1078..1122
FT                   /note="Disordered"
FT                   /evidence="ECO:0000256|SAM:MobiDB-lite"
FT   COMPBIAS        1081..1095
FT                   /note="Polar residues"
FT                   /evidence="ECO:0000256|SAM:MobiDB-lite"
FT   ACT_SITE        837
FT                   /note="Proton acceptor"
FT                   /evidence="ECO:0000256|PIRSR:PIRSR000619-1"
FT   BINDING         718..726
FT                   /ligand="ATP"
FT                   /ligand_id="ChEBI:CHEBI:30616"
FT                   /evidence="ECO:0000256|PIRSR:PIRSR000619-2"
FT   BINDING         745
FT                   /ligand="ATP"
FT                   /ligand_id="ChEBI:CHEBI:30616"
FT                   /evidence="ECO:0000256|PIRSR:PIRSR000619-2,
FT                   ECO:0000256|PROSITE-ProRule:PRU10141"
SQ   SEQUENCE   1192 AA;  132850 MW;  A131BB33E5064309 CRC64;
     MRHSGTVGAA LLVLLAAYFQ ASPALEEKKV CQGTSNRLTQ LGTFEDHFLS LQRMFNNCEV
     VLGNLEITYM QKNYDLSFLK TIQEVAGYVL IALNTVEKIP LENLQIIRGN VLYENTHALS
     VLSNYGANKV GLRELPMRNL QEILQGAVRF SNNPILCNME TIQWRDIVNS DFLSNMSVDF
     QNQLGSCQKC DPACPNGSCW GVGKENCQKL TKTICAQQCS GRCRGRSPSD CCHNQCAAGC
     TGPRESDCLV CRKFRDEATC KDTCPPLMLY NPTTYQMDVN PDGKYSFGAT CVKKCPRNYV
     VTDHGSCVRA CSSDSYEVEE DGVRKCKKCE GPCRKVCNGI GIGEFKDTLS INATNIKHFK
     NCTSISGDLH ILPVAFRGDS FTRTPPLDPK ELDILQTVKE ITGFLLIQAW PENRTDLHAF
     ENLEIIRGRT KQHGQFSLAV VGLDITSLGL RSLKEISDGD VIISGNRNLC YANTIKWKKL
     FGTSSQKTKI INNRSEKDCK TVGHVCNLLC SSEGCWGPEP RDCVSCQNVS RGKECVEKCN
     ILEGEPREFV ENSECIQCHP ECLPQAMNIT CTGRGPDNCI KCAHYIDGPH CVKTCPSGIM
     GENNTLVWKF ADANHVCHLC HPNCTYGCAG PGLEGCARNG PKIPSIATGI VGGLLLVVVV
     ALGIGLFLRR RHIVRKRTLR RLLQERELVE PLTPSGEAPN QALLRILKET EFKKIKVLGS
     GAFGTVYKGL WIPEGEKVKI PVAIKELREA TSPKANKEIL DEAYVMASVD NPHVCRLLGI
     CLTSTVQLIT QLMPFGCLLD YVREHKDNIG SQYLLNWCVQ IAKGMNYLED RRLVHRDLAA
     RNVLVKTPQH VKITDFGLAK LLGAEEKEYH AEGGKVPIKW MALESILHRI YTHQSDVWSY
     GVTVWELMTF GSKPYDGIPA SEISTILEKG ERLPQPPICT IDVYMIMVKC WMIDADSRPK
     FRELIIEFSK MARDPQRYLV IQGDERMHLP SPTDSNFYRT LMDEEDMEDV VDADEYLIPQ
     QGFFHSPSTS RTPLISSLSC PLKEDSFLQR YSSDPTGTVT EDNIDDTFLP APEYVNQSVP
     KRPAGSVQNP VYHNQPLNPA PGRDPHYQNP HSNAMDNPEY LNTTHPDCVN SVLDGTALWA
     QKGNHQISLD NPDYQQDFFP KEAKSNGIFK GPAAENAEYL RVAPPSSEFI GA
//