位置:首页 > 蛋白库 > CO1A1_ORYAF
CO1A1_ORYAF
ID   CO1A1_ORYAF             Reviewed;         987 AA.
AC   C0HJN3;
DT   22-JUL-2015, integrated into UniProtKB/Swiss-Prot.
DT   22-JUL-2015, sequence version 1.
DT   03-AUG-2022, entry version 14.
DE   RecName: Full=Collagen alpha-1(I) chain {ECO:0000303|PubMed:25799987};
DE   AltName: Full=Alpha-1 type I collagen {ECO:0000250|UniProtKB:P02452};
DE   Flags: Fragments;
GN   Name=COL1A1 {ECO:0000250|UniProtKB:P02452};
OS   Orycteropus afer (Aardvark).
OC   Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi; Mammalia;
OC   Eutheria; Afrotheria; Tubulidentata; Orycteropodidae; Orycteropus.
OX   NCBI_TaxID=9818 {ECO:0000303|PubMed:25799987};
RN   [1] {ECO:0000305}
RP   PROTEIN SEQUENCE, AND IDENTIFICATION BY MASS SPECTROMETRY.
RC   TISSUE=Bone {ECO:0000303|PubMed:25799987};
RX   PubMed=25799987; DOI=10.1038/nature14249;
RA   Welker F., Collins M.J., Thomas J.A., Wadsley M., Brace S., Cappellini E.,
RA   Turvey S.T., Reguero M., Gelfo J.N., Kramarz A., Burger J.,
RA   Thomas-Oates J., Ashford D.A., Ashton P.D., Rowsell K., Porter D.M.,
RA   Kessler B., Fischer R., Baessmann C., Kaspar S., Olsen J.V., Kiley P.,
RA   Elliott J.A., Kelstrup C.D., Mullin V., Hofreiter M., Willerslev E.,
RA   Hublin J.J., Orlando L., Barnes I., MacPhee R.D.;
RT   "Ancient proteins resolve the evolutionary history of Darwin's South
RT   American ungulates.";
RL   Nature 522:81-84(2015).
CC   -!- FUNCTION: Type I collagen is a member of group I collagen (fibrillar
CC       forming collagen). {ECO:0000305}.
CC   -!- SUBUNIT: Trimers of one alpha 2(I) and two alpha 1(I) chains.
CC       {ECO:0000305}.
CC   -!- SUBCELLULAR LOCATION: Secreted. Secreted, extracellular space.
CC       Secreted, extracellular space, extracellular matrix {ECO:0000305}.
CC   -!- TISSUE SPECIFICITY: Forms the fibrils of tendon, ligaments and bones.
CC       In bones, the fibrils are mineralized with calcium hydroxyapatite.
CC       {ECO:0000305}.
CC   -!- PTM: Prolines at the third position of the tripeptide repeating unit
CC       (G-X-Y) are hydroxylated in some or all of the chains. {ECO:0000305}.
CC   -!- SIMILARITY: Belongs to the fibrillar collagen family. {ECO:0000305}.
CC   ---------------------------------------------------------------------------
CC   Copyrighted by the UniProt Consortium, see https://www.uniprot.org/terms
CC   Distributed under the Creative Commons Attribution (CC BY 4.0) License
CC   ---------------------------------------------------------------------------
DR   AlphaFoldDB; C0HJN3; -.
DR   PRIDE; C0HJN3; -.
DR   GO; GO:0005581; C:collagen trimer; IEA:UniProtKB-KW.
DR   GO; GO:0005615; C:extracellular space; IEA:UniProtKB-SubCell.
DR   InterPro; IPR008160; Collagen.
DR   Pfam; PF01391; Collagen; 8.
PE   1: Evidence at protein level;
KW   Calcium; Collagen; Direct protein sequencing; Extracellular matrix;
KW   Hydroxylation; Phosphoprotein; Repeat; Secreted.
FT   CHAIN           1..987
FT                   /note="Collagen alpha-1(I) chain"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT                   /id="PRO_0000433497"
FT   REGION          1..987
FT                   /note="Disordered"
FT                   /evidence="ECO:0000256|SAM:MobiDB-lite"
FT   COMPBIAS        1..48
FT                   /note="Pro residues"
FT                   /evidence="ECO:0000256|SAM:MobiDB-lite"
FT   COMPBIAS        365..388
FT                   /note="Pro residues"
FT                   /evidence="ECO:0000256|SAM:MobiDB-lite"
FT   COMPBIAS        701..715
FT                   /note="Pro residues"
FT                   /evidence="ECO:0000256|SAM:MobiDB-lite"
FT   COMPBIAS        795..809
FT                   /note="Pro residues"
FT                   /evidence="ECO:0000256|SAM:MobiDB-lite"
FT   COMPBIAS        957..987
FT                   /note="Pro residues"
FT                   /evidence="ECO:0000256|SAM:MobiDB-lite"
FT   MOD_RES         93
FT                   /note="Phosphoserine"
FT                   /evidence="ECO:0000250|UniProtKB:P02454"
FT   UNSURE          11
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          77
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          83
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          95
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          128
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          227
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          278
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          302
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          350
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          356
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          461
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          479
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          483
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          542
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          554
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          581
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          585
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          669
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          728
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          760
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          769
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          778
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          808
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          881
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          913
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          952
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          955
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   UNSURE          959
FT                   /note="I or L"
FT                   /evidence="ECO:0000269|PubMed:25799987"
FT   NON_CONS        309..310
FT                   /evidence="ECO:0000303|PubMed:25799987"
FT   NON_CONS        678..679
FT                   /evidence="ECO:0000303|PubMed:25799987"
FT   NON_CONS        716..717
FT                   /evidence="ECO:0000303|PubMed:25799987"
FT   NON_CONS        773..774
FT                   /evidence="ECO:0000303|PubMed:25799987"
FT   NON_CONS        908..909
FT                   /evidence="ECO:0000303|PubMed:25799987"
FT   NON_CONS        965..966
FT                   /evidence="ECO:0000303|PubMed:25799987"
SQ   SEQUENCE   987 AA;  87663 MW;  4704BDAB87565386 CRC64;
     GPMGPSGPRG IPGPPGAPGP QGFQGPPGEP GEPGASGPMG PRGPPGPPGK NGDDGEAGKP
     GRPGERGPPG PQGARGIPGT AGIPGMKGHR GFSGIDGAKG DAGPAGPKGE PGSPGENGAP
     GQMGPRGIPG ERGRPGPPGP AGARGNDGAT GAAGPPGPTG PAGPPGFPGA VGAKGEAGPQ
     GPRGSEGPQG VRGEPGPPGP AGAAGPAGNP GADGQPGAKG ANGAPGIAGA PGFPGARGPS
     GPQGPSGAPG PKGNSGEPGA PGNKGDAGAK GEPGPAGIQG PPGPAGEEGK RGARGEPGPT
     GIPGPPGERG FPGSDGVAGP KGPVGERGSP GPAGPKGSPG EAGRPGEAGI PGAKGITGSP
     GSPGPDGKTG PPGPAGQDGR PGPPGPPGAR GQAGVMGFPG PKGAAGEPGK AGERGVPGPP
     GAVGAPGKDG EAGAPGATGP AGPAGERGEQ GPAGSPGFQG IPGPAGPPGE SGKPGEQGIP
     GDIGAPGPSG ARGERGFPGE RGVQGPPGPA GPRGSNGAPG NDGAKGDAGA PGAPGSQGAP
     GIQGMPGERG AAGIPGPKGD RGDAGPKGAD GSPGKDGPRG ITGPIGPPGP AGAPGDKGES
     GPNGPAGPTG ARGAPGDRGE PGPPGPAGFA GPPGADGQPG AKGEPGDAGA KGDAGPPGPA
     GPTGAPGPIG NVGAPGPKGS PGPPGATGFP GAAGRVGPPG PSGNAGPPGP PGPAGKGETG
     PAGRPGEIGP PGPPGPSGEK GSPGADGPAG APGTPGPQGI GGQRGVVGIP GQRGFPGIPG
     PSGEPGKQGP SGPNGERGPP GPMGPPGIAG PPGESGREGS PGAEGSPGRD GSPGPKGDRG
     ETGPAGPPGA PGAPGAPGPV GPAGKSGDRG ETGPAGPAGP IGPVGARGPT GPQGPRGDKG
     ETGEQGDRGF SGIQGPPGPP GSPGEQGPSG ASGPAGPRGP PGSAGAPGKD GINGIPGPIG
     PPGPRTGDAG PVGPPGPPGP PGPPGPP
 
 
维奥蛋白资源库 - 中文蛋白资源 CopyRight © 2010-2024