GlobalChem Protein
from global_chem_extensions import GlobalChemExtensions
bioinformatics = GlobalChemExtensions().bioinformatics()
Last updated
from global_chem_extensions import GlobalChemExtensions
bioinformatics = GlobalChemExtensions().bioinformatics()
Last updated
gc_protein = bioinformatics.initialize_globalchem_protein(
peptide_sequence='AAAA',
)
<PandasPDB> Object
smiles_protein = gc_protein.convert_to_smiles(
mark_nitrogen_backbone=False,
mark_carbonyl_carbon_backbone = False,
)
print (smiles_protein)
[N:1]C(C)C([N:1]C(C)C([N:1]C(C)C([N:1]C(C)C([N:1]CC(O)=O)=O)=O)=O)=O
smarts_protein = gc_protein.convert_to_smarts(
mark_nitrogen_backbone=False,
mark_carbonyl_carbon_backbone = False,
)
print (smarts_protein)
[#7:1]-[#6](-[#6])-[#6](-[#7:1]-[#6](-[#6])-[#6](-[#7:1]-[#6](-[#6])-[#6](-[#7:1]-[#6](-[#6])-[#6](-[#7:1]-[#6]-[#6](-[#8])=[#8])=[#8])=[#8])=[#8])=[#8]
smiles_molecule = gc_protein.convert_ligand_to_smiles()
CS(=O)(=O)N1CCOC(C1)c2csc(n2)c3ccccc3NC(=O)c4[nH]ccn4
1.) 80 < molecular weight (Da) < 750
2.) 10 < number of nonhydrogen atoms < 70
3.) Must not contain atoms of types other than
H, C, O, N, F, P, S, Cl, Br, or I
4.) must contain at least one
non-carbon/non-hydrogen atom
5.) must not contain two or more phosphorus atoms
6.) must not have more than 10 rotatable bonds
7.) must not be a nucleic acid
8.) must not be composed only from
non-lead-like PDB-HET-groups
9.) must not be covalently bound
10.) must not have protein contacts from the crystal
packing environment in less than 3 Å distance
11.) must have contacts with protein in less than
7 Å distance
pdb_ids = ['5tc0', '4EHM',]
for pdb in pdb_ids:
    gc_protein = gce.initialize_globalchem_protein(
        pdb_id='5tc0',
    )
    criteria_met = gc_protein.determine_bostrom_ligand_criteria(verbose=True)
    ligand_smiles = gc_protein.ligand_smiles
    print ("Ligand: %s, Criteria Met: %s" % (ligand_smiles, criteria_met))
Passed Check 1 Molecular Weight: 433.08784608800005
Passed Check 2 Non Hydrogen Atoms: 29
Passed Check 3 All Atoms Are Within Element Boundaries
Passed Check 4 Non-Hydrogen & Non-Carbon Atoms Present: 11
Passed Check 5 Less than Two Phosphorous atoms Present
Passed Check 6 Less than Ten Rotatable Bonds Present
Passed Check 7 No Nucleic Acid Template Found
Passed Check 9 Not a Covalent Inhibitor
Check 11 Has Contacts within 7 Angstroms
Ligand: CS(=O)(=O)N1CCOC(C1)c2csc(n2)c3ccccc3NC(=O)c4[nH]ccn4, Criteria Met: True
Passed Check 1 Molecular Weight: 358.0688674079999
Passed Check 2 Non Hydrogen Atoms: 26
Passed Check 3 All Atoms Are Within Element Boundaries
Passed Check 4 Non-Hydrogen & Non-Carbon Atoms Present: 8
Passed Check 5 Less than Two Phosphorous atoms Present
Passed Check 6 Less than Ten Rotatable Bonds Present
Passed Check 7 No Nucleic Acid Template Found
Failed Check 9
Passed Check 1 Molecular Weight: 358.0688674079999
Passed Check 2 Non Hydrogen Atoms: 26
Passed Check 3 All Atoms Are Within Element Boundaries
Passed Check 4 Non-Hydrogen & Non-Carbon Atoms Present: 8
Passed Check 5 Less than Two Phosphorous atoms Present
Passed Check 6 Less than Ten Rotatable Bonds Present
Passed Check 7 No Nucleic Acid Template Found
Failed Check 9
Ligand: Cc1cc(c(c2c1C(=O)Oc3c(c(cc(c3O2)C(=O)O)OC)C)C=O)O, Criteria Met: False