dockonsurf / modules / calculation.py @ 78fcb188
Historique | Voir | Annoter | Télécharger (8,98 ko)
1 | 3d6a9d3c | Carles | import os |
---|---|---|---|
2 | 3d6a9d3c | Carles | import logging |
3 | 3d6a9d3c | Carles | |
4 | 3d6a9d3c | Carles | logger = logging.getLogger('DockOnSurf')
|
5 | 3d6a9d3c | Carles | |
6 | 3d6a9d3c | Carles | |
def check_finished_calcs(run_type, code):
    """Sorts the configurations of a run into normally/abnormally finished.

    Every entry of the 'run_type' directory that is itself a directory and
    whose name contains 'conf_' is inspected. Only the 'cp2k' code is handled:
    for any other value of 'code' the configuration is added to neither list.

    For cp2k a configuration counts as finished normally when exactly one
    '*.out' file and exactly one '*-1.restart' file are present and the text
    "PROGRAM STOPPED IN" is found in what tail() returns for the output file.
    Missing files, several matching files (a warning is logged in that case)
    or a missing end mark classify the configuration as finished abnormally.

    @param run_type: The type of calculation to check. It is also the name of
        the directory holding the 'conf_*' subdirectories.
    @param code: The code used for the specified job.
    @return finished_calcs: List of calculations that have finished normally.
    @return unfinished_calcs: List of calculations that have finished
        abnormally.
    """
    from glob import glob
    from modules.utilities import tail

    finished_calcs = []
    unfinished_calcs = []
    for conf in os.listdir(run_type):
        conf_dir = f'{run_type}/{conf}'
        if 'conf_' not in conf or not os.path.isdir(conf_dir):
            continue
        if code != 'cp2k':
            continue

        out_files = glob(f"{conf_dir}/*.out")
        restart_files = glob(f"{conf_dir}/*-1.restart")

        # TODO report separately a missing output and a missing restart file.
        if not out_files or not restart_files:
            unfinished_calcs.append(conf)
            continue

        if len(out_files) > 1 or len(restart_files) > 1:
            # Ambiguous directory: it cannot be told which file is the
            # relevant one, so the configuration is treated as unfinished.
            logger.warning(
                f'There is more than one file matching the {code} '
                f'pattern for finished calculation (*.out / '
                f'*-1.restart) in {run_type}/{conf}: '
                f'{out_files, restart_files}. '
                f'Skipping directory.')
            unfinished_calcs.append(conf)
            continue

        # The file is handed to tail() opened in binary mode; tail() is
        # presumably returning the decoded last lines -- TODO confirm.
        with open(out_files[0], 'rb') as out_fh:
            ended_normally = "PROGRAM STOPPED IN" in tail(out_fh)
        if ended_normally:
            finished_calcs.append(conf)
        else:
            unfinished_calcs.append(conf)
    return finished_calcs, unfinished_calcs
44 | f85667b9 | Carles Marti | |
45 | f85667b9 | Carles Marti | |
def prep_cp2k(inp_file, run_type, atms_list, proj_name):
    """Prepares the directories to run calculations with CP2K.

    The CP2K input is parsed, its project name is set to
    '<proj_name>_<run_type>' and, when the input does not define
    'COORD_FILE_NAME', 'coord.xyz' is used. The resulting input is written in
    the current working directory under the base name of 'inp_file', and this
    rewritten file (not the original one) is copied to every configuration
    directory so that the modifications reach the actual calculations.

    For every element of 'atms_list' a '<run_type>/conf_<i>' directory is
    created containing the input file and the coordinates file.

    @param inp_file: CP2K Input file to run the calculations with.
    @param run_type: Type of calculation. 'isolated', 'screening' or
        'refinement'. The directory with this name must already exist.
    @param atms_list: list of ase.Atoms objects to run the calculation of.
    @param proj_name: name of the project
    @return: None
    """
    from shutil import copy
    import ase.io
    from pycp2k import CP2K
    from modules.utilities import check_bak

    cp2k = CP2K()
    cp2k.parse(inp_file)
    cp2k.CP2K_INPUT.GLOBAL.Project_name = proj_name+"_"+run_type
    force_eval = cp2k.CP2K_INPUT.FORCE_EVAL_list[0]

    # The modified input is always written in the working directory, under
    # the bare file name of the provided input.
    new_inp_file = os.path.basename(inp_file)
    if force_eval.SUBSYS.TOPOLOGY.Coord_file_name is None:
        logger.warning("'COORD_FILE_NAME' not specified on CP2K input. Using\n"
                       "'coord.xyz'. A new CP2K input file with "
                       "the 'COORD_FILE_NAME' variable is created.")
        force_eval.SUBSYS.TOPOLOGY.Coord_file_name = 'coord.xyz'
        check_bak(new_inp_file)
    cp2k.write_input_file(new_inp_file)

    coord_file = force_eval.SUBSYS.TOPOLOGY.Coord_file_name

    # Creating and setting up directories for every configuration.
    for i, conf in enumerate(atms_list):
        conf_dir = f'{run_type}/conf_{i}'
        os.mkdir(conf_dir)
        # Copy the rewritten input: copying 'inp_file' would drop the project
        # name / COORD_FILE_NAME changes whenever it lives in another
        # directory than the working one.
        copy(new_inp_file, f'{conf_dir}/')
        ase.io.write(f'{conf_dir}/{coord_file}', conf)
79 | f3004731 | Carles | |
80 | f3004731 | Carles | |
def get_jobs_status(job_ids, stat_cmd, stat_dict):
    """Queries the status of every job and translates it to 'r', 'p' or 'f'.

    For each job the command 'stat_cmd % job' is run through the shell and its
    stripped standard output is compared, for exact equality, with the values
    of 'stat_dict' in the order 'r', 'p', 'f'. The first matching key is
    stored. When the output matches none of them a warning is logged and
    nothing is stored for that job, so the returned list can be shorter than
    'job_ids'.

    @param job_ids: list of all jobs to be checked their status.
    @param stat_cmd: Command to check job status. It must contain one '%'
        placeholder that is filled with the job id.
    @param stat_dict: Dictionary with pairs of job status (r, p, f) and the
        pattern it matches in the output of the stat_cmd.
    @return: list of status ('r', 'p' or 'f') of the jobs whose status was
        recognized.
    """
    from subprocess import PIPE, Popen

    status_list = []
    for job in job_ids:
        process = Popen(stat_cmd % job, shell=True, stdout=PIPE)
        raw_output = process.communicate()[0]
        stat_msg = raw_output.decode('utf-8').strip()
        for label in ('r', 'p', 'f'):
            if stat_dict[label] == stat_msg:
                status_list.append(label)
                break
        else:
            # None of the three known patterns matched the command output.
            logger.warning(f'Unrecognized job {job} status: {stat_msg}')
    return status_list
104 | b461f289 | Carles Marti | |
105 | b461f289 | Carles Marti | |
def submit_jobs(run_type, sub_cmd, sub_script, stat_cmd, stat_dict, max_jobs,
                name):
    """Submits jobs to a custom queuing system with the provided script

    For every 'conf_*' subdirectory of 'run_type' the submission script is
    copied into it and the submission command is executed from inside that
    directory. Before each submission the queue is polled every 30 seconds
    until none of the limits in 'max_jobs' is reached. Once everything is
    submitted the function blocks, polling every 30 seconds, until all the
    tracked jobs are reported as finished.

    The job id is taken from the output of the submission command: it is the
    first whitespace-separated word that is an integer once '<' and '>' are
    removed. If no such word exists a warning is logged and the job is not
    tracked.

    @param run_type: Type of calculation. 'isolated', 'screening', 'refinement'
    @param sub_cmd: Bash command used to submit jobs. It must contain two '%s'
        placeholders: the job name and the submission script.
    @param sub_script: script for the job submission.
    @param stat_cmd: Bash command to check job status.
    @param stat_dict: Dictionary with pairs of job status: r, p, f (ie. running
        pending and finished) and the pattern it matches in the output of the
        stat_cmd.
    @param max_jobs: dict: Contains the maximum number of jobs to be both
        running ('r'), pending/queued ('p') and pending+running ('rp'). When
        the relevant maximum is reached no jobs more are submitted.
    @param name: name of the project. Its first five characters are used to
        build the job names.
    """
    from shutil import copy
    from time import sleep
    from subprocess import PIPE, Popen

    def _queue_is_full(job_ids):
        """Polls the queue once and tells whether any job limit is reached."""
        statuses = get_jobs_status(job_ids, stat_cmd, stat_dict)
        running = statuses.count("r")
        pending = statuses.count("p")
        return (running + pending >= max_jobs['rp']
                or running >= max_jobs['r']
                or pending >= max_jobs['p'])

    subm_jobs = []
    for conf in os.listdir(run_type):
        conf_dir = f"{run_type}/{conf}"
        # Same filter as check_finished_calcs: anything that is not a
        # configuration directory (stray files, backups...) is ignored instead
        # of breaking the extraction of the configuration index below.
        if not os.path.isdir(conf_dir) or 'conf_' not in conf:
            continue
        i = conf.split('_')[1]

        # A single poll per check gives a consistent snapshot of the queue and
        # avoids querying the scheduler several times for the same answer.
        while _queue_is_full(subm_jobs):
            sleep(30)

        copy(sub_script, conf_dir)
        job_name = f'{name[:5]}{run_type[:3].capitalize()}{i}'
        sub_order = sub_cmd % (job_name, sub_script)
        # The command is run from the configuration directory through 'cwd'
        # so that the working directory of this process is never changed and
        # there is nothing to restore if the submission raises.
        subm_msg = Popen(sub_order, shell=True, stdout=PIPE,
                         cwd=conf_dir).communicate()[0]
        job_id = None
        for word in subm_msg.decode("utf-8").split():
            try:
                job_id = int(word.replace('>', '').replace('<', ''))
                break
            except ValueError:
                continue
        if job_id is None:
            logger.warning(f'Could not get the job id of {job_name} from the '
                           f'output of the submission command. The job will '
                           f'not be tracked.')
            continue
        subm_jobs.append(job_id)

    logger.info('All jobs have been submitted, waiting for them to finish.')
    while not all(stat == 'f' for stat in
                  get_jobs_status(subm_jobs, stat_cmd, stat_dict)):
        sleep(30)
    logger.info('All jobs have finished.')
157 | 12001182 | Carles | |
158 | 12001182 | Carles | |
def run_calc(run_type, inp_vars, atms_list):
    """Directs the calculation run according to the provided arguments.

    After validating 'run_type' (case-insensitively; the lower-case form is
    used from then on) a fresh directory named after it is created, the
    per-configuration directories are prepared for the requested code and,
    if a supported batch queuing system is specified, the jobs are submitted
    and waited for.

    @param run_type: Type of calculation. 'isolated', 'screening' or
        'refinement'
    @param inp_vars: Calculation parameters from input file. The keys read
        here are 'batch_q_sys', 'code', 'project_name', 'subm_script',
        'max_jobs' and the input file key matching the run type
        ('isol_inp_file', 'screen_inp_file' or 'refine_inp_file').
    @param atms_list: List of ase.Atoms objects containing the sets of atoms
        aimed to run the calculations of.
    @raise ValueError: if 'run_type' is not one of the accepted values.
    """
    from modules.utilities import check_bak

    run_types = ['isolated', 'screening', 'refinement']
    if not isinstance(run_type, str) or run_type.lower() not in run_types:
        run_type_err = f"'run_type' must be one of the following: {run_types}"
        logger.error(run_type_err)
        raise ValueError(run_type_err)
    # The check above is case-insensitive, so the value is normalized to keep
    # the dictionary lookup below from failing on e.g. 'Screening'.
    run_type = run_type.lower()

    batch_q_sys = inp_vars['batch_q_sys']
    if batch_q_sys:
        logger.info(f"Running {run_type} calculation with {inp_vars['code']} on"
                    f" {batch_q_sys}.")
    else:
        logger.info(f"Doing a dry run of {run_type}.")
    check_bak(run_type)
    os.mkdir(run_type)

    # Prepare directories and files for relevant code.
    input_files = {'isolated': 'isol_inp_file', 'screening': 'screen_inp_file',
                   'refinement': 'refine_inp_file', }
    if inp_vars['code'] == 'cp2k':
        prep_cp2k(inp_vars[input_files[run_type]], run_type, atms_list,
                  inp_vars['project_name'])
    # elif: inp_vars['code'] == 'Other codes here'

    # Submit/run Jobs
    # For every supported queuing system: the submission command, the command
    # printing the status of a job and the status strings it prints for
    # running ('r') and pending ('p') jobs. A finished job ('f') prints
    # nothing.
    queue_systems = {
        'sge': ('qsub -N %s %s',
                "qstat | grep %s | awk '{print $5}'",
                {'r': 'r', 'p': 'qw', 'f': ''}),
        'lsf': ('bsub -J %s < %s',
                "bjobs -w | grep %s | awk '{print $3}'",
                {'r': 'RUN', 'p': 'PEND', 'f': ''}),
        'irene': ('ccc_msub -r %s %s',
                  "ccc_mstat | grep %s | awk '{print $10}' | cut -c1",
                  {'r': 'R', 'p': 'P', 'f': ''}),
    }
    if batch_q_sys in queue_systems:
        sub_cmd, stat_cmd, stat_dict = queue_systems[batch_q_sys]
        submit_jobs(run_type, sub_cmd, inp_vars['subm_script'], stat_cmd,
                    stat_dict, inp_vars['max_jobs'], inp_vars['project_name'])
    elif batch_q_sys == 'local':
        pass  # TODO implement local
    elif batch_q_sys:
        # Directories are prepared but nothing can be submitted.
        logger.warning(f"Unsupported batch queuing system '{batch_q_sys}'. "
                       f"No jobs have been submitted.")