1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310
|
import coot
import coot_utils
import coot_contact_score_isolated_ligand
def get_metrics_for_ligand(imol, chain_id, res_no, ins_code,
refmac_input_mtz_file_name,
fobs_col, sig_fobs_col, rfree_col,
refmac_dir):
"""
Args:
refmac_dir: the dir where input/output refmac files should be written.
Return:
[correlation, mogul, bumps, difference_map_stats, b_factor_info]
where:
mogul: is either a list [mogul_z_worst, mogul_out_file_name] or an
error status
difference_map_stats:
the output of map_to_model_correlation_stats_py
[correlation, var_x, var_y, n, sum_x, sum_y, D, D2 (based on mean/sd of the map at the ligand)
map_mean map_mean_at_ligand map_sd map_sd_at_ligand )
b_factor_info:
[median_ratio median_ligand mediand_-env ks_testd_-result]
"""
def local_refmac(stub_name):
ligand_spec = [chain_id, res_no, ins_code]
neighbs = coot.residues_near_residue_py(imol, ligand_spec, 4)
rn = coot.residue_name(imol, chain_id, res_no, ins_code)
n_ligand_atoms = coot.het_group_n_atoms(rn)
if (not coot_utils.isNumber(n_ligand_atoms)):
print("BL ERROR:: failed liagnd atoms not a number.")
return False
else:
refmac_out_sfs_file_name = os.path.join(refmac_dir, \
stub_name + "-with-ligand-refmac.mtz")
with_ligand_pdb_file_name = os.path.join(refmac_dir, \
stub_name + "-with-ligand.pdb")
coot.make_directory_maybe(refmac_dir)
coot.make_directory_maybe("coot-refmac") # XYZOUT goes here
coot.write_pdb_file(imol, with_ligand_pdb_file_name)
r = get_recent_pdbe.refmac_calc_sfs_make_mtz_with_columns(with_ligand_pdb_file_name,
refmac_input_mtz_file_name,
refmac_out_sfs_file_name,
fobs_col, sig_fobs_col, rfree_col)
if not r:
print("BL ERROR:: failed calculating sfs in refmac")
return False
else:
# happy path
return refmac_out_sfs_file_name
# get_correlation at the ligand for the direct (FWT) map
#
def get_correlation(stub_name):
global refmac_extra_params
refmac_extra_params = ["refine exclude all from " + \
str(res_no) + " " + \
chain_id + " to " + \
str(res_no) + " " + \
chain_id]
print("BL DEBUG:: in get_correlation(): refmac_extra_params:", refmac_extra_params)
ligand_spec = [chain_id, res_no, ins_code]
refmac_out_sfs_file_name = local_refmac(stub_name)
if not refmac_out_sfs_file_name:
return False
else:
# happy path
imol_map = coot.make_and_draw_map(refmac_out_sfs_file_name, "FWT", "PHWT", "", 0, 0)
neighbs = coot.residues_near_residue_py(imol, ligand_spec, 4)
c = coot.map_to_model_correlation(imol, [ligand_spec], neighbs, 0, imol_map)
coot.close_molecule(imol_map)
return c
# return False or a list of stats.
#
def get_ligand_difference_map_stats(stub_name):
global refmac_extra_params
refmac_extra_params = False # reset - no ligand exclusion
refmac_out_sfs_file_name = local_refmac(stub_name + "-for-ligand-diff-map")
ligand_spec = [chain_id, res_no, ins_code]
neighbs = coot.residues_near_residue_py(imol, ligand_spec, 4)
if not refmac_out_sfs_file_name:
return False
else:
# happy path
imol_map = coot.make_and_draw_map(refmac_out_sfs_file_name,
"DELFWT", "PHDELWT", "", 0, 1)
# now do some stats on the map at the ligand site
c = coot.map_to_model_correlation_stats_py(imol, [ligand_spec],
neighbs, 10, imol_map)
print("BL INFO:: residue %s density statistics %s!" \
%(ligand_spec, c))
return c
# Return an error status (False, i.e. not a list) or a list
# [mogul_z_worst, mogul_out_file_name] on success.
#
# (PE note: we want the filename so that we can show mogul markup
# on the ligand when we activate this function from the gui)
def get_mogul_score(use_cache_qm):
# if run_result is a list it contains the mogul-output file name
# if it is False something went wrong
#
run_result = run_mogul("BONDS_AND_ANGLES", imol, chain_id,
res_no, ins_code,
"ligand-check", use_cache_qm)
print("BL DEBUG:: run_results (mogul): ", chain_id, res_no, run_result)
if not run_result:
return False
else:
# happy path
if use_cache_qm:
# return a random mogul_score
return [123, run_result]
mogul_results_list = coot.mogul_results_py(run_result)
if (not isinstance(mogul_results_list, list)):
return False
else:
if (len(mogul_results_list) == 0):
mogul_score = "MOGUL_NO_STATS"
else:
mogul_score = max(mogul_results_list)
return [mogul_score, run_result]
def get_ligand_dictionary_based_geometry_stats():
ligand_spec = [chain_id, res_no, ins_code]
summary_info = get_ligand_distortion_summary_info(imol, ligand_spec)
print("##### we got summary-info", summary_info)
return summary_info
# return a list: n_bad_overlaps n_hydrogen_bonds n_small_overlaps n_close_contacts n_wide_contacts
#
def get_bump_score():
ligand_spec = [chain_id, res_no, ins_code]
cs = coot_contact_score_isolated_ligand.contact_score_ligand(imol, ligand_spec)
coot.graphics_draw()
return cs
# return a list of [median_ratio, median_ligand, mediand_-env, ks_test_result]
# stub_name is only passed so that we can write diagnostics to standard-out.
#
def get_b_factor_distribution_metrics(stub_name):
def median_ratio(ligand_b_factors, env_b_factors):
# maybe the second one should include the ligand Bs?!
return median(ligand_b_factors) / median(env_b_factors)
def filter_out_waters(imol, env_residues):
def is_not_water(residue_item):
rn = coot.residue_name(imol,
res_spec_utils.residue_spec_to_chain_id(residue_item),
res_spec_utils.residue_spec_to_res_no(residue_item),
coot_utils.residue_spec_to_ins_code(residue_item))
return (rn != "HOH" and rn != "WAT")
return [res_item for res_item in env_residues if is_not_water(res_item)]
# from http://stackoverflow.com/questions/24101524/finding-median-of-list-in-python
def median(lst):
lst = sorted(lst)
if len(lst) < 1:
return None
if len(lst) %2 == 1:
return lst[((len(lst)+1)//2)-1]
else:
return float(sum(lst[(len(lst)//2)-1:(len(lst)//2)+1]))/2.0
# Return a list of length 2:
# The first item is a list of atoms for the residue specified by ligand-spec
# It may be False, in which case this function failed to return a result
# If it is not False, the 2nd is a list of atom b-factors
#
def ligand_environment_temperature_factors(imol, ligand_spec, radius):
atoms = residue_info(imol,
res_spec_utils.residue_spec_to_chain_id(ligand_spec),
res_spec_utils.residue_spec_to_res_no(ligand_spec),
coot_utils.residue_spec_to_ins_code(ligand_spec))
env_residues = coot.residues_near_residue_py(imol, ligand_spec, radius)
non_water_env_residues = filter_out_waters(imol, env_residues)
env_residues = [residue_info(imol,
res_spec_utils.residue_spec_to_chain_id(res_spec),
res_spec_utils.residue_spec_to_res_no(res_spec),
coot_utils.residue_spec_to_ins_code(res_spec)) for res_spec in non_water_env_residues]
# this is a list of residue info not atoms, so flatten
env_atoms = []
list(map(env_atoms.extend, env_residues))
if isinstance(atoms, list):
r1 = [atom[1][1][0] \
if isinstance(atom[1][1], list) \
else atom[1][1] for atom in atoms]
else:
r1 = False
if env_atoms:
r2 = [atom[1][1][0] \
if isinstance(atom[1][1], list) \
else atom[1][1] for atom in env_atoms]
else:
r2 = False
return [r1, r2]
# main line of get_b_factor_distribution_metrics
#
ligand_spec = [chain_id, res_no, ins_code]
lig_env_temp_factors = ligand_environment_temperature_factors(imol, ligand_spec, 5)
if not isinstance(lig_env_temp_factors, list):
print("Ligand env temp factors not a list\n")
return False
if len(lig_env_temp_factors[1]) == 0:
print("WARNING:: No values in Ligand env temp factors\n")
return False
v1 = lig_env_temp_factors[0]
v2 = lig_env_temp_factors[1]
print("b-factor kolmogorov-smirnov lig:", stub_name, ligand_spec, v1)
print("b-factor kolmogorov-smirnov env:", stub_name, ligand_spec, v2)
temp_factor_median_ratio = median_ratio(v1, v2)
kolmogorov_smirnov_result = kolmogorov_smirnov(v1, v2)
return [temp_factor_median_ratio, median(v1), median(v2),
kolmogorov_smirnov]
# main line of get_metrics_for_ligand
#
stub_name = molecule_name_stub(imol, 0)
b_factor_info = get_b_factor_distribution_metrics(stub_name)
print("DEBUG:: ####################### b-factor-info:", b_factor_info)
# add error checking to this (maybe more?!)
#
cor = get_correlation(stub_name)
if (coot_utils.isNumber(cor)):
dms = get_ligand_difference_map_stats(stub_name)
if (not isinstance(dms, list)):
return False # error
else:
mog = get_mogul_score(False) # use cache for testing only
if mog:
bmp = get_bump_score()
if (isinstance(bmp, list)):
return [cor, mog, bmp, dms, b_factor_info]
else:
return False
else:
return False
else:
return False
# remove residues that are waters from env-residues
#
def filter_out_waters(imol, env_residues):
def is_not_water(residue_item):
rn = residue_name(imol,
residue_spec_to_chain_id(residue_item),
residue_spec_to_res_no(residue_item),
residue_spec_to_ins_code(residue_item))
return (rn != "HOH" and rn != "WAT")
return [res_item for res_item in env_residues if is_not_water(res_item)]
# the Yes/No tick/cross dialog
#
def gui_ligand_check_dialog_wrapper(imol, imol_map, ligand_spec):
neighbs = []
correl = coot.map_to_model_correlation_py(imol, [ligand_spec], neighbs, 0, imol_map)
cs = coot_contact_score_isolated_ligand.contact_score_ligand(imol, ligand_spec)
n_bumps = -1
if cs:
n_bumps = cs[0]
geom_dist_max = 1.1
ligand_metrics = [correl, geom_dist_max, n_bumps]
percentile_limit = 0.5 # it's a fraction
coot.gui_ligand_metrics_py(ligand_spec, ligand_metrics, percentile_limit)
# the Yes/No tick/cross dialog
def gui_ligand_check_dialog_active_residue():
with coot_utils.UsingActiveAtom(True) as [aa_imol, aa_chain_id, aa_res_no,
aa_ins_code, aa_atom_name, aa_alt_conf, aa_res_spec]:
gui_ligand_check_dialog_wrapper(aa_imol, coot.imol_refinement_map(), aa_res_spec)
def run_mogul(mode, imol, chain_id, res_no, ins_code, prefix_str, use_cache_qm):
# dummy since I cannot test mogul
# will return bogus info for now.
if use_cache_qm:
# for testing return a random Z and random file name
return [2, "dummy"]
else:
return False
|