{"ymdb_id":"YMDB00082","created_at":"2011-05-29T15:54:58.000Z","updated_at":"2016-09-08T18:34:59.000Z","name":"Carbamoylphosphate","cas":"590-55-6","state":"Solid","melting_point":"","description":"Carbamoylphosphate is required for the synthesis of arginine and pyrimidines. Carbamoylphosphate is produced from bicarbonate and glutamine in an ATP-dependent reaction. ","experimental_water_solubility":"","experimental_logp_hydrophobicity":"","location":"cytoplasm","synthesis_reference":null,"chebi_id":"17672","hmdb_id":"HMDB01096","kegg_id":"C00169","pubchem_id":"278","cs_id":"272","foodb_id":null,"wikipedia_link":"Carbamoyl_phosphate","biocyc_id":"CARBAMOYL-P","iupac":"(carbamoyloxy)phosphonic acid","traditional_iupac":"carbamoyl-phosphate","logp":"-1.2107563936666663","pka":"6.126245825395335","alogps_solubility":"1.56e+01 g/l","alogps_logp":"-1.52","alogps_logs":"-0.96","acceptor_count":"4","donor_count":"3","rotatable_bond_count":"2","polar_surface_area":"109.85","refractivity":"22.4801","polarizability":"9.115059988547511","formal_charge":"0","physiological_charge":"-2","pka_strongest_basic":null,"pka_strongest_acidic":"1.1011909792872663","bioavailability":"1","number_of_rings":"0","rule_of_five":"1","ghose_filter":"0","veber_rule":"0","mddr_like_rule":"0","synonyms":["carbamic acid monoanhydride with phosphorate","carbamic acid monoanhydride with phosphoric acid","Carbamoyl phosphate","carbamoyl-P","carbamoyl-phosphate","Carbamoylphosphate","Carbamoylphosphic acid","carbamyl phosphate","carbamyl-phosphate"],"pathways":[{"name":"Purine metabolism","kegg_map_id":"00230"},{"name":"Pyrimidine metabolism","kegg_map_id":"00240"},{"name":"Alanine, aspartate and glutamate metabolism","kegg_map_id":"00250"},{"name":"Arginine and proline metabolism","kegg_map_id":"00330"},{"name":"Nitrogen metabolism","kegg_map_id":"00910"}],"growth_conditions":[],"references":[{"pubmed_id":21051339,"citation":"UniProt Consortium (2011). 
\"Ongoing and future developments at the Universal Protein Resource.\" Nucleic Acids Res 39:D214-D219."},{"pubmed_id":21062828,"citation":"Scheer, M., Grote, A., Chang, A., Schomburg, I., Munaretto, C., Rother, M., Sohngen, C., Stelzer, M., Thiele, J., Schomburg, D. (2011). \"BRENDA, the enzyme information system in 2011.\" Nucleic Acids Res 39:D670-D676."},{"pubmed_id":18846089,"citation":"Herrgard, M. J., Swainston, N., Dobson, P., Dunn, W. B., Arga, K. Y., Arvas, M., Bluthgen, N., Borger, S., Costenoble, R., Heinemann, M., Hucka, M., Le Novere, N., Li, P., Liebermeister, W., Mo, M. L., Oliveira, A. P., Petranovic, D., Pettifer, S., Simeonidis, E., Smallbone, K., Spasic, I., Weichart, D., Brent, R., Broomhead, D. S., Westerhoff, H. V., Kirdar, B., Penttila, M., Klipp, E., Palsson, B. O., Sauer, U., Oliver, S. G., Mendes, P., Nielsen, J., Kell, D. B. (2008). \"A consensus yeast metabolic network reconstruction obtained from a community approach to systems biology.\" Nat Biotechnol 26:1155-1160."},{"pubmed_id":15128434,"citation":"Serre, V., Penverne, B., Souciet, J. L., Potier, S., Guy, H., Evans, D., Vicart, P., Herve, G. (2004). \"Integrated allosteric regulation in the S. cerevisiae carbamylphosphate synthetase - aspartate transcarbamylase multifunctional protein.\" BMC Biochem 5:6."},{"pubmed_id":6370999,"citation":"Eisenstein, E., Osborne, J. C. Jr, Chaiken, I. M., Hensley, P. (1984). 
\"Purification and characterization of ornithine transcarbamoylase from Saccharomyces cerevisiae.\" J Biol Chem 259:5139-5145."}],"proteins":[{"created_at":"2011-05-24T19:26:20.000Z","updated_at":"2011-05-29T05:06:11.000Z","name":"Carbamoyl-phosphate synthase arginine-specific small chain","uniprot_id":"P07258","uniprot_name":"CARA_YEAST","enzyme":true,"transporter":false,"gene_name":"CPA1","num_residues":411,"molecular_weight":"45361.19922","theoretical_pi":"7.32","general_function":"Involved in catalytic activity","specific_function":"2 ATP + L-glutamine + HCO(3)(-) + H(2)O = 2 ADP + phosphate + L-glutamate + carbamoyl phosphate","reactions":[{"id":2254,"direction":"\u003e","locations":"Cytoplasm","altext":"2 ATP + L-glutamine + HCO(3)(-) + H(2)O = 2 ADP + phosphate + L-glutamate + carbamoyl phosphate.","export":false,"pw_reaction_id":null,"source":null}],"signal_regions":"None","transmembrane_regions":"None","pdb_id":null,"cellular_location":"Cytoplasm","genbank_gene_id":"K02132","genbank_protein_id":"171305","gene_card_id":"CPA1","chromosome_location":"chromosome 15","locus":"YOR303W","synonyms":["CPS-A","Arginine-specific carbamoyl-phosphate synthetase, glutamine chain"],"enzyme_classes":["6.3.5.5"],"go_classes":[{"category":"Component","description":" Not Available"},{"category":"Function","description":" carbamoyl-phosphate synthase activity"},{"category":"Function","description":" catalytic activity"},{"category":"Function","description":" ligase activity"},{"category":"Function","description":" ligase activity, forming carbon-nitrogen bonds"},{"category":"Process","description":" glutamine family amino acid metabolic process"},{"category":"Process","description":" glutamine metabolic process"},{"category":"Process","description":" metabolic process"},{"category":"Process","description":" nitrogen compound metabolic process"},{"category":"Process","description":" cellular metabolic process"},{"category":"Process","description":" cellular amino acid and 
derivative metabolic process"},{"category":"Process","description":" cellular amino acid metabolic process"}],"pfams":[{"name":"GATase","identifier":"PF00117"},{"name":"CPSase_sm_chain","identifier":"PF00988"}],"pathways":[{"name":"Pyrimidine metabolism","kegg_map_id":"00240"},{"name":"Alanine, aspartate and glutamate metabolism","kegg_map_id":"00250"}],"gene_sequence":"ATGTCCTCCGCTGCAACAAAAGCTACTTTCTGTATTCAAAATGGTCCTTCCTTTGAAGGTATATCTTTTGGTGCAAACAAATCTGTTGCTGGTGAAACAGTTTTCACTACTTCTCTGGTTGGTTACCCAGAGTCCATGACTGATCCTTCCTACCGTGGTCAGATATTAGTCTTCACGCAACCCTTGATTGGTAACTACGGTGTCCCATCCGGCGAAGCCCGCGATGAATACAATTTACTGAAGTATTTTGAATCTCCGCATATACATGTGGTCGGCATCGTTGTCGCTGAATATGCTTATCAATATTCGCATTGGACCGCTGTTGAATCTCTGGCACAATGGTGTCAGAGAGAAGGTGTTGCTGCTATTACTGGCGTAGACACCCGTGAACTAGTGCAATACTTGAGGGAACAAGGTTCTTCTTTGGGCCGTATTACGTTGGCTGATCATGACCCTGTCCCCTACGTGAATCCCATGAAAACTAACTTGGTTGCTCAAGTCACCACAAAAAAGCCTTTCCACGTCTCTGCCTTACCTGGGAAGGCTAAGGCAAATGTGGCTCTTATTGACTGTGGTGTTAAAGAAAACATTATCAGATGCCTAGTCAAAAGAGGTGCCAATGTAACTGTTTTCCCCTATGATTACAGAATTCAAGATGTTGCTTCTGAATTCGACGGTATTTTCTTATCCAATGGACCAGGCAACCCAGAACTATGCCAAGCTACAATTTCCAACGTCAGGGAATTACTAAATAACCCTGTTTATGACTGTATCCCTATTTTTGGGATTTGTCTAGGCCATCAACTCTTGGCTCTGGCCTCCGGTGCCTCTACTCACAAATTGAAATATGGTAATAGGGCTCACAACATCCCTGCCATGGATTTGACTACCGGCCAGTGCCACATTACATCTCAAAATCATGGCTATGCAGTTGATCCTGAGACCCTACCAAAGGACCAATGGAAACCTTATTTTGTTAATTTAAACGACAAATCAAACGAAGGCATGATACACCTTCAAAGACCCATATTTTCTACCCAATTTCACCCAGAGGCAAAAGGTGGTCCCTTAGACACAGCTATTCTTTTTGACAAATTCTTCGATAATATAGAAAAATACCAATTACAATCTCAGGCAAAAAGTTCAATCTCACTAAAAGTAACATACAGTACCGATAAATCGAGATTGCAGAGTATAAATGTTACTAAGTTGGCCAAGGAAAGAGTGTTGTTCTAA","protein_sequence":"MSSAATKATFCIQNGPSFEGISFGANKSVAGETVFTTSLVGYPESMTDPSYRGQILVFTQPLIGNYGVPSGEARDEYNLLKYFESPHIHVVGIVVAEYAYQYSHWTAVESLAQWCQREGVAAITGVDTRELVQYLREQGSSLGRITLADHDPVPYVNPMKTNLVAQVTTKKPFHVSALPGKAKANVALIDCGVKENIIRCLVKRGANVTVFPYDYRIQDVASEFDGIFLSNGPGNPELCQATISNVRELLNNPVYDCIPIFGICLGHQLLALASGASTHKLKYGNRAHNIPAMDLTTGQCHITSQNHGYAVDPETLPKDQWKPYFVNLNDKSNEGMIHLQRPIFSTQFHPEAKGGPLDTAILFDKFFDN
IEKYQLQSQAKSSISLKVTYSTDKSRLQSINVTKLAKERVLF"},{"created_at":"2011-05-24T19:28:29.000Z","updated_at":"2011-07-22T17:54:22.000Z","name":"Protein URA1","uniprot_id":"P07259","uniprot_name":"PYR1_YEAST","enzyme":true,"transporter":false,"gene_name":"URA2","num_residues":2214,"molecular_weight":"245124.0","theoretical_pi":"5.64","general_function":"Involved in carboxyl- or carbamoyltransferase activity","specific_function":"This protein is a \"fusion\" protein encoding three enzymatic activities of the pyrimidine pathway (GATase, CPSase, and ATCase)","reactions":[{"id":1332,"direction":"\u003e","locations":"cytoplasm","altext":null,"export":true,"pw_reaction_id":null,"source":null},{"id":1365,"direction":"\u003e","locations":"cytoplasm","altext":null,"export":true,"pw_reaction_id":null,"source":null},{"id":2254,"direction":"\u003e","locations":"Cytoplasm","altext":"2 ATP + L-glutamine + HCO(3)(-) + H(2)O = 2 ADP + phosphate + L-glutamate + carbamoyl phosphate.","export":false,"pw_reaction_id":null,"source":null},{"id":2256,"direction":"\u003e","locations":null,"altext":"Carbamoyl phosphate + L-aspartate = phosphate + N-carbamoyl-L-aspartate.","export":false,"pw_reaction_id":null,"source":null},{"id":3739,"direction":"\u003e","locations":null,"altext":null,"export":true,"pw_reaction_id":"PW_R006264","source":"Smpdb"},{"id":14248,"direction":"\u003e","locations":null,"altext":null,"export":true,"pw_reaction_id":"PW_R006692","source":"Smpdb"},{"id":14248,"direction":"\u003e","locations":null,"altext":null,"export":true,"pw_reaction_id":"PW_R006692","source":"Smpdb"},{"id":14249,"direction":"\u003e","locations":null,"altext":null,"export":true,"pw_reaction_id":"PW_R006733","source":"Smpdb"}],"signal_regions":"None","transmembrane_regions":"None","pdb_id":null,"cellular_location":null,"genbank_gene_id":"M27174","genbank_protein_id":"173146","gene_card_id":"URA2","chromosome_location":"chromosome 10","locus":"YJL130C","synonyms":["Glutamine-dependent carbamoyl-phosphate 
synthase","Aspartate carbamoyltransferase"],"enzyme_classes":["6.3.5.5","2.1.3.2"],"go_classes":[{"category":"Component","description":" Not Available"},{"category":"Function","description":" binding"},{"category":"Function","description":" nucleoside binding"},{"category":"Function","description":" purine nucleoside binding"},{"category":"Function","description":" adenyl nucleotide binding"},{"category":"Function","description":" catalytic activity"},{"category":"Function","description":" adenyl ribonucleotide binding"},{"category":"Function","description":" transferase activity"},{"category":"Function","description":" ATP binding"},{"category":"Function","description":" carbamoyl-phosphate synthase activity"},{"category":"Function","description":" ligase activity"},{"category":"Function","description":" aspartate carbamoyltransferase activity"},{"category":"Function","description":" ligase activity, forming carbon-nitrogen bonds"},{"category":"Function","description":" carboxylic acid binding"},{"category":"Function","description":" amino acid binding"},{"category":"Function","description":" carboxyl- or carbamoyltransferase activity"},{"category":"Function","description":" transferase activity, transferring one-carbon groups"},{"category":"Process","description":" cellular amino acid and derivative metabolic process"},{"category":"Process","description":" nucleobase metabolic process"},{"category":"Process","description":" cellular amino acid metabolic process"},{"category":"Process","description":" pyrimidine base metabolic process"},{"category":"Process","description":" glutamine family amino acid metabolic process"},{"category":"Process","description":" pyrimidine base biosynthetic process"},{"category":"Process","description":" glutamine metabolic process"},{"category":"Process","description":" 'de novo' pyrimidine base biosynthetic process"},{"category":"Process","description":" metabolic process"},{"category":"Process","description":" nitrogen compound 
metabolic process"},{"category":"Process","description":" cellular aromatic compound metabolic process"},{"category":"Process","description":" cellular metabolic process"}],"pfams":[{"name":"GATase","identifier":"PF00117"},{"name":"CPSase_sm_chain","identifier":"PF00988"},{"name":"CPSase_L_chain","identifier":"PF00289"},{"name":"CPSase_L_D2","identifier":"PF02786"},{"name":"CPSase_L_D3","identifier":"PF02787"},{"name":"MGS","identifier":"PF02142"},{"name":"OTCace","identifier":"PF00185"},{"name":"OTCace_N","identifier":"PF02729"}],"pathways":[{"name":"Pyrimidine metabolism","kegg_map_id":"00240"},{"name":"Alanine, aspartate and glutamate metabolism","kegg_map_id":"00250"}],"gene_sequence":"ATGGCCACTATTGCTCCCACTGCTCCAATCACCCCTCCAATGGAATCTACGGGTGACCGTCTGGTTACGTTGGAACTTAAGGACGGCACGGTCTTACAAGGTTATTCATTTGGTGCTGAGAAATCCGTCGCTGGTGAATTAGTTTTCCAAACTGGTATGGTTGGTTATCCTGAATCTGTGACCGATCCATCTTATGAAGGCCAGATCTTAGTCATCACTTACCCATTGGTAGGCAATTATGGTGTCCCAGATATGCACTTGAGAGATGAATTGGTCGAAGAATTGCCAAGATATTTTGAAAGTAATAGAATCCATATTGCCGGTTTAGTTATTTCTCACTATACCGACGAGTACTCTCATTATCTTGCTAAATCTTCCTTAGGTAAATGGTTACAAAATGAAGGGATCCCAGCTGTTTATGGTGTTGATACAAGATCATTGACCAAGCATTTGAGAGATGCAGGTTCAATGTTGGGTAGGTTGTCTTTGGAAAAAAGCGGCTCTGACAGAACCATCTCCAGATCTTCCTCTTGGAGAAGTGCGTTTGATGTTCCTGAATGGGTGGATCCAAATGTTCAAAACCTAGTTTCTAAGGTCTCCATCAATGAACCTAAATTGTACGTTCCTCCAGCAGACAATAAGCACATCGAATTGCAAACCGGACCCGATGGTAAAGTTTTAAGGATTCTAGCCATTGACGTGGGTATGAAATACAATCAAATTCGTTGTTTTATCAAAAGGGGTGTAGAATTGAAAGTTGTTCCATGGAACTACGATTTCACTAAAGAAGATTATGATGGTCTGTTTATTTCAAATGGTCCAGGTGATCCATCTGTTCTAGATGATCTATCTCAAAGATTGTCAAATGTCCTGGAGGCTAAAAAGACGCCAGTATTCGGTATTTGTCTCGGTCATCAATTGATAGCAAGAGCTGCCGGTGCATCCACCCTAAAACTAAAATTTGGTAACCGTGGTCATAACATACCTTGTACATCAACTATAAGTGGTCGTTGTTACATAACATCTCAAAACCATGGGTTCGCTGTGGATGTTGACACTCTAACTTCCGGATGGAAGCCATTGTTTGTTAACGCGAATGATGACTCTAACGAAGGTATCTATCATTCTGAATTACCTTATTTTTCCGTCCAATTCCATCCAGAATCCACACCTGGCCCAAGAGATACAGAATTCTTGTTTGACGTTTTTATCCAAGCAGTTAAAGAATTCAAGTATACACAAGTGTTGAAACCAATCGCTTTCCCAGGTGGCCTATTAGAGGATAACGTTAAGGCACACCC
TAGAATCGAAGCGAAGAAGGTTCTAGTTCTCGGTTCTGGTGGTTTGTCCATCGGTCAAGCTGGTGAATTTGACTACTCTGGTTCTCAAGCCATCAAAGCTTTGAAAGAAGAAGGTATCTATACAATTTTAATTAATCCAAACATTGCTACCATCCAAACTTCGAAAGGGTTGGCTGATAAGGTTTATTTTGTTCCTGTTACTGCAGAGTTCGTGAGAAAAGTTATTTTACATGAAAGGCCGGACGCCATTTATGTGACATTTGGTGGACAAACTGCTTTATCTGTTGGTATAGCCATGAAAGATGAATTTGAGGCGTTAGGAGTTAAAGTATTGGGTACTCCAATCGATACTATTATTACCACGGAAGACCGTGAACTCTTCAGTAATGCCATTGACGAAATTAATGAAAAATGTGCGAAATCTCAAGCTGCTAATTCAGTGGACGAGGCATTGGCCGCTGTCAAGGAGATCGGTTTCCCAGTTATTGTACGTGCTGCATATGCATTGGGAGGTTTAGGTTCCGGTTTCGCTAATAATGAAAAAGAATTGGTTGATCTATGTAATGTTGCATTTTCATCCTCACCTCAAGTTTTAGTCGAGAAATCTATGAAAGGTTGGAAAGAAGTCGAATATGAAGTTGTTCGTGATGCTTTTGACAACTGTATTACTGTTTGTAATATGGAAAATTTTGATCCACTAGGTATTCACACCGGTGATTCCATCGTTGTAGCCCCATCTCAAACTTTATCTGATGAAGATTACAATATGTTAAGAACTACTGCTGTTAATGTTATTAGACACTTAGGTGTTGTTGGTGAATGTAATATCCAATATGCTTTAAATCCCGTTTCTAAGGATTATTGCATCATTGAAGTTAATGCGCGTTTGTCACGTTCCTCTGCTTTAGCTTCTAAGGCTACTGGTTACCCATTGGCCTACACTGCGGCTAAGTTAGGTTTGAATATCCCATTAAATGAAGTTAAGAATTCCGTCACAAAATCCACATGTGCTTGTTTTGAACCTTCTCTAGACTACTGTGTTGTCAAAATGCCAAGATGGGATTTGAAGAAGTTCACCAGAGTTTCTACCGAATTATCTTCATCAATGAAATCTGTTGGTGAAGTTATGAGCATCGGTAGAACCTTCGAAGAAGCTATTCAAAAAGCTATCAGATCCACAGAATATGCTAACCTCGGATTCAATGAGACAGATCTAGATATCGACATTGATTACGAGTTGAACAACCCTACGGATATGCGTGTCTTCGCCATTGCAAATGCTTTTGCTAAGAAGGGATATTCTGTTGATAAAGTCTGGGAAATGACTAGAATTGATAAGTGGTTTTTAAACAAACTGCACGATTTGGTCCAATTTGCTGAGAAAATTAGTTCATTTGGTACTAAAGAGGAATTACCTTCCTTAGTTTTAAGACAGGCTAAGCAGTTAGGTTTTGATGACAGACAGATTGCAAGATTTTTGGATTCCAACGAAGTTGCCATCCGTAGATTAAGAAAAGAATATGGAATTACACCATTTGTCAAACAAATTGATACAGTTGCCGCTGAATTCCCCGCTTACACGAACTATTTATACATGACATACAATGCTGACTCACACGATTTATCCTTTGATGACCACGGTGTTATGGTCTTGGGTTCTGGTGTTTACCGTATCGGTTCTTCTGTCGAATTTGATTGGTGTGCTGTTACTGCAGTTAGAACATTACGTGCCAACAATATCAAAACTATCATGGTCAACTATAATCCAGAAACTGTTTCCACAGATTATGATGAGGCTGATAGACTATACTTTGAAACCATCAACCTTGAAAGAGTTTTGGATATTTACGAGATTGAAAACTCAAGCGGTGTTGTCGTATCAATGGGTGGTCAAACTTCCAACAACATCGCCATGACTTTACATCGTGAAAATGTAAAGATTCTTGGTACATCCCCTGACATGATTGATTCTGCTGAAAACCGTTACAAGTTCTCTCGTA
TGTTGGATCAAATTGGTGTTGACCAACCAGCTTGGAAAGAATTGACATCCATGGACGAAGCTGAATCTTTTGCCGAAAAGGTGGGTTATCCAGTTTTGGTACGTCCATCTTATGTGTTATCCGGTGCCGCCATGAATACTGTTTATTCTAAAAACGATTTGGAATCCTACTTAAACCAAGCCGTCGAAGTTTCACGTGATTATCCTGTTGTTATCACTAAATATATTGAAAACGCAAAGGAGATTGAAATGGATGCAGTTGCAAGAAATGGTGAATTGGTTATGCATGTTGTCTCTGAGCATGTTGAAAATGCAGGTGTCCACTCGGGTGATGCAACATTAATCGTTCCACCTCAAGATTTGGCTCCTGAAACTGTGGATAGAATTGTTGTCGCCACTGCTAAAATTGGTAAGGCTTTGAAAATTACAGGTCCATACAACATCCAATTCATTGCAAAGGACAATGAAATCAAGGTCATAGAATGTAATGTTCGTGCTTCGAGATCTTTCCCATTCATTTCAAAGGTTGTTGGCGTCAATCTGATTGAATTGGCAACAAAGGCCATAATGGGTTTGCCTTTGACGCCTTATCCTGTTGAAAAATTACCAGATGATTATGTCGCCGTTAAAGTACCACAATTCTCTTTCCCACGTTTAGCAGGAGCTGATCCAGTCTTAGGTGTTGAAATGGCCTCTACTGGTGAAGTCGCTACTTTTGGCCACTCGAAGTATGAAGCATACTTAAAGTCTTTGTTGGCAACCGGCTTCAAACTTCCAAAGAAGAATATTTTATTGTCTATTGGTTCTTACAAGGAAAAACAAGAATTGCTTTCTTCCGTACAAAAACTATACAACATGGGATATAAATTATTTGCAACATCAGGTACTGCTGACTTTTTATCTGAACATGGTATTGCCGTCCAATATCTGGAGGTTTTAAACAAGGATGATGATGATCAAAAATCAGAATACTCACTTACTCAACATTTGGCTAATAATGAAATTGACCTTTACATCAACTTGCCTTCTGCCAACAGGTTCCGTCGTCCTGCATCCTATGTTTCAAAGGGGTATAAAACACGTCGTTTGGCTGTCGATTATTCGGTTCCGTTGGTTACTAACGTTAAATGTGCAAAATTGTTGATTGAAGCCATTTCAAGAAATATCACTTTAGATGTTTCTGAACGTGATGCACAAACTTCCCACAGAACTATTACCTTACCTGGTTTAATCAATATCGCAACTTATGTTCCGAATGCATCCCATGTTATCAAAGGCCCAGCTGAACTGAAGGAGACCACACGTCTATTTTTGGAATCCGGTTTTACATACTGTCAATTGATGCCCAGATCCATCAGCGGACCTGTTATTACTGACGTTGCATCCTTGAAGGCCGCAAACTCTGTTTCCCAAGATTCATCTTACACTGACTTTTCTTTCACTATTGCTGGTACAGCACACAATGCTCATAGTGTTACGCAATCTGCTAGCAAAGTGACAGCATTGTTTTTGCCCCTACGTGAATTAAAGAACAAGATCACAGCAGTAGCTGAACTTCTGAATCAGTGGCCAACTGAAAAGCAAGTGATTGCAGAAGCTAAAACTGCAGATTTGGCATCGGTTTTATTGTTAACCTCCCTTCAAAACAGATCTATTCACATTACTGGTGTTTCGAATAAGGAAGATTTAGCTTTGATCATGACGGTCAAGGCAAAAGACCCTAGAGTGACTTGTGATGTCAATATTTATTCTTTGTTTATTGCCCAAGATGACTATCCGGAGGCAGTTTTCTTGCCTACTAAGGAAGATCAAGAGTTTTTCTGGAACAACCTTGATAGTATCGATGCTTTCTCTGTCGGTGCTCTTCCTGTCGCCTTGGCAAATGTCACAGGTAACAAGGTTGATGTTGGTATGGGTATCAAAGATTCATTACCACTATTGTTGGCTGCTGTTGAAGAAGGTAAATTAACCATTGATGATATCGTCCTTCGTCTGCATGAC
AATCCCGCTAAAATTTTCAACATCCCTACTCAGGACTCAGTTGTCGAAATTGATTTGGATTATTCTTTCAGACGTAATAAGAGATGGTCACCATTCAACAAAGATATGAACGGTGGTATTGAGCGTGTTGTCTATAATGGCGAAACATTAGTTTTGAGCGGTGAATTAGTTTCACCAGGCGCCAAAGGAAAATGCATTGTTAATCCAAGTCCAGCTTCCATAACTGCTTCCGCAGAGCTCCAATCTACTAGTGCTAAAAGAAGGTTCTCGATCACGGAAGAAGCAATCGCTGATAATTTAGATGCCGCGGAGGATGCAATTCCAGAACAGCCTTTGGAACAAAAATTGATGTCTTCAAGGCCACCAAGAGAACTTGTTGCTCCAGGCGCCATCCAGAATTTGATCCGTAGTAACAATCCATTCCGCGGAAGACATATATTGTCTATCAAACAATTCAAACGTTCTGATTTCCATGTGTTGTTTGCTGTTGCACAAGAACTAAGGGCACGTGTCGCAAGAGAAGGTGTCTTAGATTTAATGAAAGGCCACGTTATTACTACAATTTTCTTTGAACCATCTACTCGTACTTGTTCTTCATTCATTGCTGCTATGGAACGTTTGGGTGGTAGAATTGTAAATGTTAATCCATTGGTGTCTTCTGTCAAGAAAGGTGAAACCCTTCAAGATACTATCAGAACTTTGGCTTGTTACAGTGATGCCATTGTCATGCGTCATTCAGAAGAAATGTCTGTTCATATCGCCGCTAAATATTCTCCTGTTCCAATTATTAATGGTGGTAATGGTTCTCGCGAGCATCCTACGCAGGCCTTCTTGGATTTGTTTACGATTCGTGAAGAAATCGGTACTGTTAATGGTATTACTGTTACTTTCATGGGTGATCTCAAACATGGTAGAACCGTACATTCATTGTGTCGTTTGTTAATGCACTATCAAGTCAGAATTAATCTTGTTTCTCCTCCGGAATTGAGGTTACCAGAAGGATTAAGAGAAGAGCTAAGAAAAGCTGGCTTACTTGGTGTTGAGAGCATTGAATTAACCCCTCATATCATCTCAAAGACCGATGTTCTGTATTGTACAAGGGTCCAAGAAGAAAGATTCAATAGCCCTGAAGAATATGCACGTCTGAAGGATACTTATATCGTGGACAACAAGATCTTGGCACACGCCAAAGAAAATATGGCTATCATGCATCCATTGCCTCGTGTAAATGAAATCAAAGAGGAAGTGGACTACGATCATCGTGCTGCTTACTTCAGACAAATGAAGTATGGTTTGTTCGTCAGAATGGCTTTGTTGGCCATGGTCATGGGTGTTGATATGTGA","protein_sequence":"MATIAPTAPITPPMESTGDRLVTLELKDGTVLQGYSFGAEKSVAGELVFQTGMVGYPESVTDPSYEGQILVITYPLVGNYGVPDMHLRDELVEELPRYFESNRIHIAGLVISHYTDEYSHYLRKSSLGKWLQNEGIPAVYGVDTRSLTKHLRDAGSMLGRLSLEKSGSDRTISRSSSWRSAFDVPEWVDPNVQNLVSKVSINEPKLYVPPADNKHIELQTGPDGKVLRILAIDVGMKYNQIRCFIKRGVELKVVPWNYDFTKEDYDGLFISNGPGDPSVLDDLSQRLSNVLEAKKTPVFGICLGHQLIARAAGASTLKLKFGNRGHNIPCTSTISGRCYITSQNHGFAVDVDTLTSGWKPLFVNANDDSNEGIYHSELPYFSVQFHPESTPGPRDTEFLFDVFIQAVKEFKYTQVLKPIAFPGGLLEDNVKAHPRIEAKKVLVLGSGGLSIGQAGEFDYSGSQAIKALKEEGIYTILINPNIATIQTSKGLADKVYFVPVTAEFVRKVILHERPDAIYVTFGGQTALSVGIAMKDEFEALGVKVLGTPIDTIITTEDRELFSNAIDEINEKCAKSQAANSVDEALAAVKEIGFPVIVRAAYALGGLGSGFANNEKELVDLCNVAFSSSPQVLVE
KSMKGWKEVEYEVVRDAFDNCITVCNMENFDPLGIHTGDSIVVAPSQTLSDEDYNMLRTTAVNVIRHLGVVGECNIQYALNPVSKDYCIIEVNARLSRSSALASKATGYPLAYTAAKLGLNIPLNEVKNSVTKSTCACFEPSLDYCVVKMPRWDLKKFTRVSTELSSSMKSVGEVMSIGRTFEEAIQKAIRSTEYANLGFNETDLDIDIDYELNNPTDMRVFAIANAFAKKGYSVDKVWEMTRIDKWFLNKLHDLVQFAEKISSFGTKEELPSLVLRQAKQLGFDDRQIARFLDSNEVAIRRLRKEYGITPFVKQIDTVAAEFPAYTNYLYMTYNADSHDLSFDDHGVMVLGSGVYRIGSSVEFDWCAVTAVRTLRANNIKTIMVNYNPETVSTDYDEADRLYFETINLERVLDIYEIENSSGVVVSMGGQTSNNIAMTLHRENVKILGTSPDMIDSAENRYKFSRMLDQIGVDQPAWKELTSMDEAESFAEKVGYPVLVRPSYVLSGAAMNTVYSKNDLESYLNQAVEVSRDYPVVITKYIENAKEIEMDAVARNGELVMHVVSEHVENAGVHSGDATLIVPPQDLAPETVDRIVVATAKIGKALKITGPYNIQFIAKDNEIKVIECNVRASRSFPFISKVVGVNLIELATKAIMGLPLTPYPVEKLPDDYVAVKVPQFSFPRLAGADPVLGVEMASTGEVATFGHSKYEAYLKSLLATGFKLPKKNILLSIGSYKEKQELLSSVQKLYNMGYKLFATSGTADFLSEHGIAVQYLEVLNKDDDDQKSEYSLTQHLANNEIDLYINLPSANRFRRPASYVSKGYKTRRLAVDYSVPLVTNVKCAKLLIEAISRNITLDVSERDAQTSHRTITLPGLINIATYVPNASHVIKGPAELKETTRLFLESGFTYCQLMPRSISGPVITDVASLKAANSVSQDSSYTDFSFTIAGTAHNAHSVTQSASKVTALFLPLRELKNKITAVAELLNQWPTEKQVIAEAKTADLASVLLLTSLQNRSIHITGVSNKEDLALIMTVKAKDPRVTCDVNIYSLFIAQDDYPEAVFLPTKEDQEFFWNNLDSIDAFSVGALPVALANVTGNKVDVGMGIKDSLPLLLAAVEEGKLTIDDIVLRLHDNPAKIFNIPTQDSVVEIDLDYSFRRNKRWSPFNKDMNGGIERVVYNGETLVLSGELVSPGAKGKCIVNPSPASITASAELQSTSAKRRFSITEEAIADNLDAAEDAIPEQPLEQKLMSSRPPRELVAPGAIQNLIRSNNPFRGRHILSIKQFKRSDFHVLFAVAQELRAAVAREGVLDLMKGHVITTIFFEPSTRTCSSFIAAMERLGGRIVNVNPLVSSVKKGETLQDTIRTLACYSDAIVMRHSEEMSVHIAAKYSPVPIINGGNGSREHPTQAFLDLFTIREEIGTVNGITVTFMGDLKHGRTVHSLCRLLMHYQVRINLVSPPELRLPEGLREELRKAGLLGVESIELTPHIISKTDVLYCTRVQEERFNSPEEYARLKDTYIVDNKILAHAKENMAIMHPLPRVNEIKEEVDYDHRAAYFRQMKYGLFVRMALLAMVMGVDM"},{"created_at":"2011-05-24T19:30:54.000Z","updated_at":"2011-05-29T05:06:11.000Z","name":"Carbamoyl-phosphate synthase arginine-specific large chain","uniprot_id":"P03965","uniprot_name":"CARB_YEAST","enzyme":true,"transporter":false,"gene_name":"CPA2","num_residues":1118,"molecular_weight":"123914.0","theoretical_pi":"4.95","general_function":"Involved in ATP binding","specific_function":"2 ATP + L-glutamine + 
HCO(3)(-) + H(2)O = 2 ADP + phosphate + L-glutamate + carbamoyl phosphate","reactions":[{"id":2254,"direction":"\u003e","locations":"Cytoplasm","altext":"2 ATP + L-glutamine + HCO(3)(-) + H(2)O = 2 ADP + phosphate + L-glutamate + carbamoyl phosphate.","export":false,"pw_reaction_id":null,"source":null}],"signal_regions":"None","transmembrane_regions":"None","pdb_id":null,"cellular_location":"Cytoplasm","genbank_gene_id":"K01178","genbank_protein_id":"171310","gene_card_id":"CPA2","chromosome_location":"chromosome 10","locus":"YJR109C","synonyms":["Arginine-specific carbamoyl-phosphate synthetase, ammonia chain"],"enzyme_classes":["6.3.5.5"],"go_classes":[{"category":"Component","description":" Not Available"},{"category":"Function","description":" adenyl nucleotide binding"},{"category":"Function","description":" adenyl ribonucleotide binding"},{"category":"Function","description":" ATP binding"},{"category":"Function","description":" carbamoyl-phosphate synthase activity"},{"category":"Function","description":" catalytic activity"},{"category":"Function","description":" ligase activity"},{"category":"Function","description":" ligase activity, forming carbon-nitrogen bonds"},{"category":"Function","description":" binding"},{"category":"Function","description":" nucleoside binding"},{"category":"Function","description":" purine nucleoside binding"},{"category":"Process","description":" metabolic process"},{"category":"Process","description":" nitrogen compound metabolic process"}],"pfams":[{"name":"CPSase_L_chain","identifier":"PF00289"},{"name":"CPSase_L_D2","identifier":"PF02786"},{"name":"CPSase_L_D3","identifier":"PF02787"},{"name":"MGS","identifier":"PF02142"}],"pathways":[{"name":"Pyrimidine metabolism","kegg_map_id":"00240"},{"name":"Alanine, aspartate and glutamate 
metabolism","kegg_map_id":"00250"}],"gene_sequence":"ATGACATCGATTTATACATCAACAGAGCCTACGAATTCTGCTTTTACTACCGAGGACTACAAACCTCAATTAGTTGAAGGAGTAAATTCTGTACTTGTCATTGGATCAGGAGGGCTCTCTATTGGTCAAGCTGGTGAATTCGATTACAGTGGTTCTCAAGCTATCAAAGCTCTGAAGGAAGATAACAAGTTTACTATATTGGTTAACCCAAATATCGCTACTAACCAGACTTCTCATTCCCTGGCGGACAAGATTTATTACTTGCCCGTTACACCAGAATACATCACATATATCATTGAACTTGAAAGGCCGGATGCTATACTTTTAACCTTCGGTGGTCAAACAGGTCTAAATTGTGGGGTGGCTCTGGATGAATCTGGTGTTTTGGCTAAATACAACGTCAAAGTTTTAGGTACTCCTATCAAAACTTTGATCACTTCTGAAGATAGGGATCTTTTCGCATCTGCGTTAAAGGATATCAACATTCCCATCGCAGAATCATTTGCTTGTGAAACCGTGGATGAAGCTTTGGAGGCTGCTGAAAGGGTCAAATACCCAGTTATTGTCAGATCTGCATACGCTTTGGGTGGGTTAGGCTCAGGTTTCGCTAACAATGCAAGTGAAATGAAGGAACTTGCCGCACAGTCCTTGTCGTTGGCCCCACAAATTCTTGTTGAAAAATCTTTGAAAGGTTGGAAAGAAGTTGAATATGAAGTGGTCAGAGATAGGGTTGGTAACTGTATTACAGTATGTAATATGGAAAATTTCGACCCACTTGGTGTTCATACTGGTGATTCTATGGTTTTTGCTCCTTCGCAGACCCTATCAGATGAAGAGTTTCATATGTTAAGATCCGCCGCAATTAAAATCATTAGACACCTTGGTGTTATTGGTGAATGTAATGTCCAATACGCTTTGCAACCTGATGGGCTAGACTATAGAGTTATTGAAGTGAACGCACGTTTATCTCGTTCCTCTGCATTGGCGTCTAAGGCCACTGGTTATCCCTTAGCATACACTGCCGCCAAAATTGGGCTAGGCTATACTTTGCCAGAATTGCCAAACCCAATCACAAAAACTACAGTGGCTAACTTTGAGCCATCTTTGGATTATATTGTGGCAAAAATACCTAAGTGGGATCTTTCTAAGTTCCAATACGTGGACAGATCCATTGGTTCCTCTATGAAATCAGTTGGAGAAGTTATGGCTATTGGTAGAAACTATGAAGAAGCCTTTCAAAAAGCATTAAGACAGGTGGATCCATCATTATTGGGATTCCAAGGTTCTACTGAATTCGGCGATCAACTTGATGAAGCCTTGAGAACTCCAACTGATAGAAGAGTCCTTGCCATTGGTCAGGCCTTAATCCATGAAAACTATACTGTTGAGAGAGTTAATGAATTGAGTAAAATTGATAAATGGTTTCTTTACAAGTGCATGAACATTGTTAATATCTATAAAGAGCTTGAATCAGTTAAATCTTTAAGTGACTTGAGTAAAGATCTCTTGCAGAGAGCCAAGAAATTAGGGTTTTCAGATAAGCAGATTGCGGTTACTATAAATAAACACGCCTCCACAAACATTAACGAACTGGAAATCAGAAGTTTAAGAAAAACGTTAGGTATAATCCCTTTTGTCAAGAGAATCGATACTTTGGCCGCAGAATTTCCAGCACAAACCAATTATTTGTATACCACTTACAATGCTACAAAGAACGATGTGGAGTTCAACGAAAATGGTATGCTGGTTTTAGGCTCTGGTGTCTATCGTATTGGTTCATCTGTAGAATTTGATTGGTGTGCCGTGAACACCGCGAAGACATTAAGAGATCAAGGCAAGAAAACTATCATGATAAATTATAACCCAGAAACAGTTTCCACAGATTTCGATGAAGTTGATAGATTATACTTTGAAGAATTATCGTATGAAAGAGTGATGGACATTTAT
GAGTTGGAGCAATCTGAGGGTTGCATTATTTCTGTCGGTGGTCAATTACCTCAAAACATTGCCTTGAAACTTTACGATAACGGCTGTAATATAATGGGTACCAATCCAAACGATATTGATAGAGCTGAGAACAGACACAAATTCTCATCTATTTTGGATTCTATTGATGTTGACCAACCTGAATGGAGTGAATTAACATCAGTAGAAGAAGCAAAATTATTTGCTTCTAAAGTTAACTACCCTGTGTTGATTCGTCCCTCATATGTTCTTTCCGGTGCGGCAATGAGTGTTGTTAATAATGAGGAGGAACTGAAGGCTAAATTAACTTTGGCATCTGACGTTTCTCCAGACCATCCAGTCGTCATGTCTAAATTTATTGAAGGTGCTCAAGAAATTGATGTGGACGCCGTTGCTTATAATGGTAATGTCTTGGTACATGCCATTTCCGAGCATGTTGAAAATGCGGGTGTGCACTCCGGTGATGCTTCTTTAGTCTTACCGCCACAACATCTTTCTGACGATGTGAAGATTGCCCTAAAAGACATTGCTGATAAGGTCGCAAAAGCTTGGAAGATCACTGGCCCCTTCAATATGCAAATCATCAAGGATGGGGAGCATACATTGAAAGTGATTGAATGTAACATTAGAGCTTCTAGATCATTTCCATTCGTTTCAAAAGTTTTAGGCGTTAATTTTATTGAAATTGCTGTCAAGGCATTTTTGGGCGGTGACATTGTACCAAAACCTGTTGATTTGATGCTCAACAAAAAGTACGACTATGTTGCTACTAAAGTTCCTCAATTTTCCTTTACAAGGTTGGCTGGTGCAGATCCTTTCTTAGGGGTTGAAATGGCATCAACTGGTGAAGTTGCTTCATTTGGTAGAGATTTAATTGAAAGCTATTGGACTGCTATTCAAAGTACCATGAACTTCCATGTACCACTACCTCCAAGTGGTATATTATTTGGAGGTGATACATCTCGAGAATACTTGGGCCAAGTGGCTTCCATAGTGGCCACTATTGGTTACAGAATATACACAACTAATGAGACCACTAAAACGTATCTACAGGAACACATCAAAGAAAAGAACGCAAAGGTTTCTTTGATTAAATTTCCAAAGAATGATAAGAGAAAATTGCGTGAACTATTTCAAGAATATGACATAAAAGCTGTTTTCAATTTAGCCTCCAAGAGAGCTGAGAGCACTGACGATGTTGACTATATTATGAGAAGGAATGCTATTGATTTTGCTATCCCATTGTTCAATGAACCTCAAACGGCTTTGTTATTTGCAAAGTGTTTGAAGGCAAAAATTGCAGAAAAGATCAAAATTTTGGAATCTCATGACGTTATAGTTCCACCAGAAGTCCGTTCCTGGGATGAATTTATTGGTTTCAAAGCATATTGA","protein_sequence":"MTSIYTSTEPTNSAFTTEDYKPQLVEGVNSVLVIGSGGLSIGQAGEFDYSGSQAIKALKEDNKFTILVNPNIATNQTSHSLADKIYYLPVTPEYITYIIELERPDAILLTFGGQTGLNCGVALDESGVLAKYNVKVLGTPIKTLITSEDRDLFASALKDINIPIAESFACETVDEALEAAERVKYPVIVRSAYALGGLGSGFANNASEMKELAAQSLSLAPQILVEKSLKGWKEVEYEVVRDRVGNCITVCNMENFDPLGVHTGDSMVFAPSQTLSDEEFHMLRSAAIKIIRHLGVIGECNVQYALQPDGLDYRVIEVNARLSRSSALASKATGYPLAYTAAKIGLGYTLPELPNPITKTTVANFEPSLDYIVAKIPKWDLSKFQYVDRSIGSSMKSVGEVMAIGRNYEEAFQKALRQVDPSLLGFQGSTEFGDQLDEALRTPTDRRVLAIGQALIHENYTVERVNELSKIDKWFLYKCMNIVNIYKELESVKSLSDLSKDLLQRAKKLGFSDKQIAVTINKHASTNINELEIRSLRKTLGIIPFVKRIDTLAAEFPAQTNYLYTTYN
ATKNDVEFNENGMLVLGSGVYRIGSSVEFDWCAVNTAKTLRDQGKKTIMINYNPETVSTDFDEVDRLYFEELSYERVMDIYELEQSEGCIISVGGQLPQNIALKLYDNGCNIMGTNPNDIDRAENRHKFSSILDSIDVDQPEWSELTSVEEAKLFASKVNYPVLIRPSYVLSGAAMSVVNNEEELKAKLTLASDVSPDHPVVMSKFIEGAQEIDVDAVAYNGNVLVHAISEHVENAGVHSGDASLVLPPQHLSDDVKIALKDIADKVAKAWKITGPFNMQIIKDGEHTLKVIECNIRASRSFPFVSKVLGVNFIEIAVKAFLGGDIVPKPVDLMLNKKYDYVATKVPQFSFTRLAGADPFLGVEMASTGEVASFGRDLIESYWTAIQSTMNFHVPLPPSGILFGGDTSREYLGQVASIVATIGYRIYTTNETTKTYLQEHIKEKNAKVSLIKFPKNDKRKLRELFQEYDIKAVFNLASKRAESTDDVDYIMRRNAIDFAIPLFNEPQTALLFAKCLKAKIAEKIKILESHDVIVPPEVRSWDEFIGFKAY"},{"created_at":"2011-05-26T16:52:31.000Z","updated_at":"2011-05-27T15:01:01.000Z","name":"Ornithine carbamoyltransferase","uniprot_id":"P05150","uniprot_name":"OTC_YEAST","enzyme":true,"transporter":false,"gene_name":"ARG3","num_residues":338,"molecular_weight":"37844.80078","theoretical_pi":"6.24","general_function":"Involved in carboxyl- or carbamoyltransferase activity","specific_function":"Carbamoyl phosphate + L-ornithine = phosphate + L-citrulline","reactions":[{"id":1804,"direction":"\u003e","locations":"cytoplasm","altext":null,"export":true,"pw_reaction_id":null,"source":null},{"id":2450,"direction":"\u003e","locations":"Cytoplasm","altext":"Carbamoyl phosphate + L-ornithine = phosphate + L-citrulline.","export":false,"pw_reaction_id":null,"source":null}],"signal_regions":"None","transmembrane_regions":"None","pdb_id":null,"cellular_location":"Cytoplasm","genbank_gene_id":"M11946","genbank_protein_id":"171075","gene_card_id":"ARG3","chromosome_location":"chromosome 10","locus":"YJL088W","synonyms":["Ornithine transcarbamylase","OTCase"],"enzyme_classes":["2.1.3.3"],"go_classes":[{"category":"Component","description":" macromolecular complex"},{"category":"Component","description":" protein complex"},{"category":"Component","description":" ornithine carbamoyltransferase complex"},{"category":"Function","description":" amino acid binding"},{"category":"Function","description":" carboxyl- or carbamoyltransferase 
activity"},{"category":"Function","description":" ornithine carbamoyltransferase activity"},{"category":"Function","description":" catalytic activity"},{"category":"Function","description":" transferase activity"},{"category":"Function","description":" transferase activity, transferring one-carbon groups"},{"category":"Function","description":" binding"},{"category":"Function","description":" carboxylic acid binding"},{"category":"Process","description":" metabolic process"},{"category":"Process","description":" cellular metabolic process"},{"category":"Process","description":" cellular amino acid and derivative metabolic process"},{"category":"Process","description":" cellular amino acid metabolic process"}],"pfams":[{"name":"OTCace","identifier":"PF00185"},{"name":"OTCace_N","identifier":"PF02729"}],"pathways":[{"name":"Arginine and proline metabolism","kegg_map_id":"00330"}],"gene_sequence":"ATGTCAACCACAGCATCCACGCCTTCATCTTTACGTCATTTGATTTCTATAAAAGATCTTTCTGATGAAGAATTCAGAATCTTAGTACAAAGAGCTCAACATTTCAAGAATGTTTTTAAAGCAAATAAAACGAATGATTTCCAATCCAACCATCTGAAACTATTGGGTAGAACTATAGCCTTAATATTTACTAAAAGATCAACTAGAACGAGAATTTCGACCGAAGGTGCAGCCACCTTCTTTGGTGCCCAACCGATGTTTTTAGGTAAAGAGGATATTCAGCTTGGTGTCAATGAATCATTTTACGATACCACCAAGGTTGTATCATCTATGGTTTCATGTATTTTTGCCCGTGTGAACAAACATGAAGACATACTTGCTTTTTGCAAGGATTCCTCTGTACCGATCATCAACTCTCTATGTGACAAATTCCACCCTTTGCAAGCAATTTGTGATCTTTTAACAATAATCGAAAACTTCAATATATCTCTAGATGAAGTAAATAAGGGAATCAATTCAAAATTGAAGATGGCATGGATTGGTGATGCCAATAATGTCATAAATGATATGTGCATCGCATGTCTGAAATTCGGTATAAGTGTCAGTATTTCCACTCCCCCCGGTATTGAAATGGATTCCGATATTGTCGATGAAGCAAAGAAAGTTGCTGAGAGAAACGGTGCGACATTTGAATTAACACACGACTCTTTAAAGGCCTCCACCAATGCCAATATATTAGTAACCGATACTTTCGTTTCCATGGGTGAAGAATTTGCGAAACAGGCCAAGCTGAAACAATTCAAAGGTTTTCAAATCAATCAAGAACTTGTCTCTGTGGCTGATCCAAACTACAAATTTATGCATTGTCTGCCAAGACATCAAGAAGAAGTTAGTGATGATGTCTTTTATGGAGAGCATTCCATAGTCTTTGAAGAAGCAGAAAACAGATTATATGCAGCTATGTCTGCCATTGATATCTTTGTTAATAATAAAGGTAATTTCAAGGACTTGAAATAA","protein_sequence":"MSTTASTPSSLRHLISIKDLSDEEFRILVQRAQHFKNVFKANKTNDFQSNHLK
LLGRTIALIFTKRSTRTRISTEGAATFFGAQPMFLGKEDIQLGVNESFYDTTKVVSSMVSCIFARVNKHEDILAFCKDSSVPIINSLCDKFHPLQAICDLLTIIENFNISLDEVNKGINSKLKMAWIGDANNVINDMCIACLKFGISVSISTPPGIEMDSDIVDEAKKVAERNGATFELTHDSLKASTNANILVTDTFVSMGEEFAKQAKLKQFKGFQINQELVSVADPNYKFMHCLPRHQEEVSDDVFYGEHSIVFEEAENRLYAAMSAIDIFVNNKGNFKDLK"}]}