aa_dict={"V": "valine", "VAL": "valine", "Y": "tyrosine", "TYR": "tyrosine", "T": "threonine", "THR": "threonine", "S": "serine", "SER": "serine", "P": "proline", "PRO": "proline", "F": "phenylalanine", "PHE": "phenylalanine", "M": "methionine", "MET": "methionine", "K": "lysine", "LYS": "lysine", "L": "leucine", "LEU": "leucine", "I": "isoleucine", "ILE": "isoleucine", "A": "alanine", "ALA": "alanine", "R": "arginine", "ARG": "arginine", "N": "asparagine", "ASN": "asparagine", "D": "asparticacid", "ASP": "asparticacid", "C": "cysteine", "CYS": "cysteine", "Q": "glutamine", "GLN": "glutamine", "E": "glutamicacid", "GLU": "glutamicacid", "H": "histidine", "HIS": "histidine", "W": "tryptophan", "TRP": "tryptophan", "G": "glycine", "GLY": "glycine"} amino_acid_proper = {"V": "Mass(-H2O)=99.133, Side Chain= CH3-CH(CH3)-, Occurence(%)=6.48, no charge, hydrophobic", "VAL": "Mass(-H2O)=99.133, Side Chain= CH3-CH(CH3)-, Occurence (%)=6.48, no charge, hydrophobic", "Y": "Mass(-H2O)=163.176, Side Chain= 4-OH-Phenyl-CH2-, Occurence(%)=3.25, weak charge, absorbs UV, hydrogen bonding, not hydrophilic", "TYR": "Mass(-H2O)=163.176, Side Chain= 4-OH-Phenyl-CH2-, Occurence(%)=3.25, weak charge, absorbs UV, hydrogen bonding, not hydrophilic", "T": "Mass(-H2O)=101.105, Side Chain= CH3-CH(OH)-, Occurence(%)=5.96, no charge, hydrogen bonding, hydrophilic", "THR": "Mass(-H2O)=101.105, Side Chain=CH3-CH(OH)-, Occurence(%)=5.96, no charge, hydrogen bonding, hydrophilic", "S": "Mass(-H2O)=87.078, Side Chain= HO-CH2-, Occurence(%)=7.34, no charge, hydrogen bonding, hydrophilic", "SER": "Mass(-H2O)=87.078, Side Chain=HO-CH2-, Occurence(%)=7.34, no charge, hydrogen bonding, hydrophilic", "P": "Mass(-H2O)=97.117, Side Chain= -N-(CH2)3-CH-, Occurence(%)=5.12, no charge, promotes turns, not hydrophobic", "PRO": "Mass(-H2O)=97.117, Side Chain= -N-(CH2)3-CH-, Occurence(%)=5.12, no charge, promotes turns, not hydrophobic", "F": "Mass(-H2O)=147.177, Side Chain= Phenyl-CH2-, Occurence(%)=3.91, no charge, absorbs UV, hydrophobic", "PHE": "Mass(-H2O)=147.177, Side Chain= Phenyl-CH2-, Occurence(%)=3.91, no charge, absorbs UV, hydrophobic", "M": "Mass(-H2O)=131.199, Side Chain= CH3-S-(CH2)2-, Occurence(%)=2.27, initiator of proteins, no charge, hydrophobic", "MET": "Mass(-H2O)=131.199, Side Chain= CH3-S-(CH2)2-, Occurence(%)=2.27, initiator of proteins, no charge, hydrophobic", "K": "Mass(-H2O)=128.17, Side Chain= H2N-(CH2)4-, Occurence(%)=5.82, amine in side chain, basic, reactive, strong positive charge, hydrophilic", "LYS": "Mass(-H2O)=128.17, Side Chain= H2N-(CH2)4-, Occurence(%)=5.82, amine in side chain, basic, reactive, strong positive charge, hydrophilic", "L": "Mass(-H2O)=13.160, Side Chain= (CH3)2-CH-CH2-, Occurence(%)=9.06, no charge, isomer of isoleucine, hydrophobic", "LEU": "Mass(-H2O)=13.160, Side Chain= (CH3)2-CH-CH2-, Occurence(%)=9.06, no charge, isomer of isoleucine, hydrophobic", "I": "Mass(-H2O)=113.160, Side Chain= CH3-CH2-CH(CH3)-, Occurence(%)=5.45, no charge, isomer of leucine, hydrophobic", "ILE": "Mass(-H2O)=113.160, Side Chain= CH3-CH2-CH(CH3)-, Occurence(%)=5.45, no charge, isomer of leucine, hydrophobic", "A": "Mass(-H2O)=71.079, Side Chain= CH3-, Occurence(%)=7.49, smallest amino acid, no charge, hydrophobic", "ALA": "Mass(-H2O)=71.079, Side Chain= CH3-, Occurence(%)=7.49, smallest amino acid, no charge, hydrophobic", "R": "Mass(-H2O)=156.188, Side Chain= HN=C(NH2)-NH-(CH2)3-, Occurence(%)=5.22, guanidinium side chain, basic, strongest positive charge, hydrophilic", "ARG": "Mass(-H2O)=156.188, Side Chain= HN=C(NH2)-NH-(CH2)3-, Occurence(%)=5.22, guanidinium side chain, basic, strongest positive charge, hydrophilic", "N": "Mass(-H2O)=114.104, Side Chain= H2N-CO-CH2-, Occurence(%)=4.53, amide of Asp, hydrogen bonding, no charge, hydrophilic", "ASN": "Mass(-H2O)=114.104, Side Chain= H2N-CO-CH2-, Occurence(%)=4.53, amide of Asp, hydrogen bonding, no charge, hydrophilic", "D": "Mass(-H2O)=115.089, Side Chain= HOOC-CH2-, Occurence(%)=5.22, acidic, negative charge, hydrophilic", "ASP": "Mass(-H2O)=115.089, Side Chain= HOOC-CH2-, Occurence(%)=5.22, acidic, negative charge, hydrophilic", "C": "Mass(-H2O)=103.145, Side Chain= HS-CH2-, Occurence(%)=1.82, Sulfur analog of Ser, weak charge, forms disulfide bonds, not hydrophilic", "CYS": "Mass(-H2O)=103.145, Side Chain= HS-CH2-, Occurence(%)=1.82, Sulfur analog of Ser, weak charge, forms disulfide bonds, not hydrophilic", "Q": "Mass(-H2O)=128.131, Side Chain= H2N-CO-(CH2)2-, Occurence(%)=4.11, amide of Glu, hydrogen bonding, no charge, hydrophilic", "GLN": "Mass(-H2O)=128.131, Side Chain= H2N-CO-(CH2)2-, Occurence(%)=4.11, amide of Glu, hydrogen bonding, no charge, hydrophilic", "E": "Mass(-H2O)=129.116, Side Chain= HOOC-(CH2)2-, Occurence(%)=6.26, acidic, negative charge, hydrophilic", "GLU": "Mass(-H2O)=129.116, Side Chain= HOOC-(CH2)2-, Occurence(%)=6.26, acidic, negative charge, hydrophilic", "H": "Mass(-H2O)=137.141, Side Chain= N=CH-NH-CH=C-CH2-, Occurence(%)=2.23, imidizole in side chain, basic, reactive, weak positive charge, hydrophilic", "HIS": "Mass(-H2O)=137.141, Side Chain= N=CH-NH-CH=C-CH2-, Occurence(%)=2.23, imidizole in side chain, basic, reactive, weak positive charge, hydrophilic", "W": "Mass(-H2O)=186.213, Side Chain= Phenyl-NH-CH=C-CH2-, Occurence(%)=1.32, largest amino acid, rarest amino acid, no charge, absorbs UV, hydrogen bonding, hydrophobic", "TRP": "Mass(-H2O)=186.213, Side Chain= Phenyl-NH-CH=C-CH2-, Occurence(%)=1.32, largest amino acid, rarest amino acid, no charge, absorbs UV, hydrogen bonding, hydrophobic", "G": "Mass(-H2O)=57.052, Side Chain= H-, Occurence(%)=7.10, smallest amino acid, no charge, not hydrophilic", "GLY": "Mass(-H2O)=57.052, Side Chain= H-, Occurence(%)=7.10, smallest amino acid, no charge, not hydrophilic"}