From d2586c2e4f7755e32282d5b0e0b93a7b0d65588f Mon Sep 17 00:00:00 2001 From: Carlos Cueto Date: Thu, 18 Jul 2024 13:48:03 +0100 Subject: [PATCH] Work consistently in slowness --- docker/README.md | 6 +- mosaic/cli/mrun.py | 2 +- mosaic/comms/serialisation.py | 2 +- stride/__init__.py | 4 +- stride/core.py | 4 + stride/optimisation/loss/l2_distance.py | 4 +- .../optimisers/gradient_descent.py | 6 +- stride/optimisation/optimisers/optimiser.py | 23 ++- .../optimisation/step_length/line_search.py | 6 +- stride/physics/common/devito.py | 14 +- stride/physics/iso_acoustic/devito.py | 155 +++++++++++------- stride/physics/iso_elastic/devito.py | 18 +- stride/physics/marmottant/devito.py | 6 +- stride/physics/problem_type.py | 42 +++-- stride/problem/data.py | 29 +++- 15 files changed, 199 insertions(+), 122 deletions(-) diff --git a/docker/README.md b/docker/README.md index 27f7c710..32bc49b1 100644 --- a/docker/README.md +++ b/docker/README.md @@ -81,19 +81,19 @@ docker build --network=host --file docker/Dockerfile.stride --tag stride . And to build the GPU image with `openacc` offloading and the `nvc` compiler, simply run: ```bash -docker build --build-arg base=devitocodes/base:nvidia-nvc --network=host --file docker/Dockerfile.stride --tag stride . +docker build --build-arg base=devitocodes/bases:nvidia-nvc --network=host --file docker/Dockerfile.stride --tag stride . ``` or if you wish to use the `llvm-15` (clang) compiler with `openmp` offlaoding: ```bash -docker build --build-arg base=devitocodes/base:nvidia-clang --network=host --file docker/Dockerfile.stride --tag stride . +docker build --build-arg base=devitocodes/bases:nvidia-clang --network=host --file docker/Dockerfile.stride --tag stride . ``` and finally for AMD architectures: ```bash -docker build --build-arg base=devitocodes/base:amd --network=host --file docker/Dockerfile.stride --tag stride . +docker build --build-arg base=devitocodes/bases:amd --network=host --file docker/Dockerfile.stride --tag stride . ``` diff --git a/mosaic/cli/mrun.py b/mosaic/cli/mrun.py index 38baeadb..917127ba 100644 --- a/mosaic/cli/mrun.py +++ b/mosaic/cli/mrun.py @@ -146,7 +146,7 @@ def start_runtime(*args, **extra_kwargs): _runtime.init_file(runtime_config) def run_head(): - process = cmd_subprocess.run(cmd, + process = cmd_subprocess.run(' '.join(cmd), shell=True, stdout=_stdout, stderr=_stderr) diff --git a/mosaic/comms/serialisation.py b/mosaic/comms/serialisation.py index 4d3f6f94..348f9833 100644 --- a/mosaic/comms/serialisation.py +++ b/mosaic/comms/serialisation.py @@ -35,7 +35,7 @@ def serialise(data): """ try: return pickle5_dumps(data) - except pickle.PicklingError: + except (pickle.PicklingError, AttributeError): return cloudpickle.dumps(data), [] diff --git a/stride/__init__.py b/stride/__init__.py index f8e4178c..fab679b5 100644 --- a/stride/__init__.py +++ b/stride/__init__.py @@ -108,7 +108,7 @@ async def forward(problem, pde, *args, **kwargs): published_args = await asyncio.gather(*published_args) platform = kwargs.get('platform', 'cpu') - using_gpu = platform in ['nvidia-acc', 'gpu'] + using_gpu = 'nvidia' in platform or 'gpu' in platform if using_gpu: devices = kwargs.pop('devices', None) num_gpus = gpu_count() if devices is None else len(devices) @@ -251,7 +251,7 @@ async def adjoint(problem, pde, loss, optimisation_loop, optimiser, *args, **kwa keep_residual = isinstance(step_size, LineSearch) platform = kwargs.get('platform', 'cpu') - using_gpu = platform in ['nvidia-acc', 'gpu'] + using_gpu = 'nvidia' in platform or 'gpu' in platform if using_gpu: devices = kwargs.pop('devices', None) num_gpus = gpu_count() if devices is None else len(devices) diff --git a/stride/core.py b/stride/core.py index 2f667b02..173ca64a 100644 --- a/stride/core.py +++ b/stride/core.py @@ -288,6 +288,7 @@ def __init__(self, *args, **kwargs): self.grad = None self.prec = None + self.transform = kwargs.pop('transform', None) self.graph = Graph() self.prev_op = None @@ -384,6 +385,7 @@ def detach(self, *args, **kwargs): """ kwargs['name'] = kwargs.pop('name', self._init_name) kwargs['needs_grad'] = kwargs.pop('needs_grad', self.needs_grad) + kwargs['transform'] = kwargs.pop('transform', self.transform) if hasattr(self, 'has_tessera') and self.has_tessera: cpy = self.__class__.parameter(*args, **kwargs) @@ -411,6 +413,7 @@ def as_parameter(self, *args, **kwargs): """ kwargs['name'] = kwargs.pop('name', self._init_name) kwargs['needs_grad'] = kwargs.pop('needs_grad', self.needs_grad) + kwargs['transform'] = kwargs.pop('transform', self.transform) cpy = self.__class__.parameter(*args, **kwargs) @@ -437,6 +440,7 @@ def copy(self, *args, **kwargs): """ kwargs['name'] = kwargs.pop('name', self._init_name) kwargs['needs_grad'] = kwargs.pop('needs_grad', self.needs_grad) + kwargs['transform'] = kwargs.pop('transform', self.transform) propagate_tessera = kwargs.pop('propagate_tessera', True) diff --git a/stride/optimisation/loss/l2_distance.py b/stride/optimisation/loss/l2_distance.py index 01ab0988..fd5b69ff 100644 --- a/stride/optimisation/loss/l2_distance.py +++ b/stride/optimisation/loss/l2_distance.py @@ -24,7 +24,7 @@ def __init__(self, **kwargs): self.residual = None - async def forward(self, modelled, observed, **kwargs): + def forward(self, modelled, observed, **kwargs): problem = kwargs.pop('problem', None) shot_id = problem.shot_id if problem is not None \ else kwargs.pop('shot_id', 0) @@ -38,7 +38,7 @@ async def forward(self, modelled, observed, **kwargs): return fun - async def adjoint(self, d_fun, modelled, observed, **kwargs): + def adjoint(self, d_fun, modelled, observed, **kwargs): grad_modelled = None if modelled.needs_grad: grad_modelled = +np.asarray(d_fun) * self.residual.copy(name='modelledresidual') diff --git a/stride/optimisation/optimisers/gradient_descent.py b/stride/optimisation/optimisers/gradient_descent.py index d91cc781..21a7dd8e 100644 --- a/stride/optimisation/optimisers/gradient_descent.py +++ b/stride/optimisation/optimisers/gradient_descent.py @@ -30,6 +30,6 @@ async def pre_process(self, grad=None, processed_grad=None, **kwargs): **kwargs) return processed_grad - async def update_variable(self, step_size, direction): - self.variable.data[:] -= step_size * direction.data - return self.variable + def update_variable(self, step_size, variable, direction): + variable.data[:] -= step_size * direction.data + return variable diff --git a/stride/optimisation/optimisers/optimiser.py b/stride/optimisation/optimisers/optimiser.py index 145a4a4f..87e05533 100644 --- a/stride/optimisation/optimisers/optimiser.py +++ b/stride/optimisation/optimisers/optimiser.py @@ -96,6 +96,7 @@ async def pre_process(self, grad=None, processed_grad=None, **kwargs): if dump_prec and self.variable.grad.prec is not None and problem is not None: self.variable.grad.prec.dump(path=problem.output_folder, project_name=problem.name, + parameter='raw_%s' % self.variable.grad.prec.name, version=iteration.abs_id+1) grad = self.variable.process_grad(**kwargs) @@ -105,6 +106,11 @@ async def pre_process(self, grad=None, processed_grad=None, **kwargs): project_name=problem.name, version=iteration.abs_id+1) + if dump_prec and self.variable.grad.prec is not None and problem is not None: + self.variable.grad.prec.dump(path=problem.output_folder, + project_name=problem.name, + version=iteration.abs_id+1) + min_dir = np.min(grad.data) max_dir = np.max(grad.data) @@ -171,7 +177,7 @@ async def step(self, step_size=None, grad=None, processed_grad=None, **kwargs): step_size = self.step_size if step_size is None else step_size step_loop = kwargs.pop('step_loop', None) if isinstance(step_size, LineSearch): - await step_size.init_search( + step_size.init_search( variable=self.variable, direction=direction, **kwargs @@ -185,7 +191,7 @@ async def step(self, step_size=None, grad=None, processed_grad=None, **kwargs): next_step = 1. done_search = True else: - next_step, done_search = await step_size.next_step( + next_step, done_search = step_size.next_step( variable=self.variable, direction=direction, **kwargs @@ -216,7 +222,14 @@ async def step(self, step_size=None, grad=None, processed_grad=None, **kwargs): self.variable.data[:] = variable_before.data.copy() # update variable - await self.update_variable(next_step, direction) + if self.variable.transform is not None: + variable = self.variable.transform(self.variable) + else: + variable = self.variable + upd_variable = self.update_variable(next_step, variable, direction) + if self.variable.transform is not None: + upd_variable = self.variable.transform(upd_variable) + self.variable.data[:] = upd_variable.data.copy() # post-process variable after update await self.post_process(**kwargs) @@ -262,13 +275,15 @@ async def post_process(self, **kwargs): self.variable.release_grad() @abstractmethod - async def update_variable(self, step_size, direction): + def update_variable(self, step_size, variable, direction): """ Parameters ---------- step_size : float Step size to use for updating the variable. + variable : Data + Variable to update. direction : Data Direction in which to update the variable. diff --git a/stride/optimisation/step_length/line_search.py b/stride/optimisation/step_length/line_search.py index 65a47d9e..84831ee8 100644 --- a/stride/optimisation/step_length/line_search.py +++ b/stride/optimisation/step_length/line_search.py @@ -8,12 +8,12 @@ class LineSearch: @abstractmethod - async def init_search(self, variable, direction, **kwargs): + def init_search(self, variable, direction, **kwargs): pass @abstractmethod - async def next_step(self, variable, direction, **kwargs): + def next_step(self, variable, direction, **kwargs): pass - async def forward_test(self, variable, direction, **kwargs): + def forward_test(self, variable, direction, **kwargs): pass diff --git a/stride/physics/common/devito.py b/stride/physics/common/devito.py index a939098b..a5e688d1 100644 --- a/stride/physics/common/devito.py +++ b/stride/physics/common/devito.py @@ -906,14 +906,14 @@ def set_operator(self, op, **kwargs): default_config = { 'name': self.name, 'subs': subs, - 'opt': 'advanced-fsg', + 'opt': 'advanced', } elif platform == 'cpu-icc': default_config = { 'name': self.name, 'subs': subs, - 'opt': 'advanced-fsg', + 'opt': 'advanced', 'compiler': 'icc', } @@ -921,7 +921,7 @@ def set_operator(self, op, **kwargs): default_config = { 'name': self.name, 'subs': subs, - 'opt': 'advanced-fsg', + 'opt': 'advanced', 'compiler': 'nvc', } @@ -929,7 +929,7 @@ def set_operator(self, op, **kwargs): default_config = { 'name': self.name, 'subs': subs, - 'opt': 'advanced-fsg', + 'opt': 'advanced', 'autotuning': 'off', 'compiler': 'nvc', 'language': 'openacc', @@ -940,7 +940,7 @@ def set_operator(self, op, **kwargs): default_config = { 'name': self.name, 'subs': subs, - 'opt': 'advanced-fsg', + 'opt': 'advanced', 'compiler': 'cuda', 'language': 'cuda', 'platform': 'nvidiaX', @@ -950,7 +950,7 @@ def set_operator(self, op, **kwargs): default_config = { 'name': self.name, 'subs': subs, - 'opt': 'advanced-fsg', + 'opt': 'advanced', 'compiler': 'hip', 'language': 'hip', 'platform': 'amdgpuX', @@ -964,7 +964,7 @@ def set_operator(self, op, **kwargs): context = {'log-level': 'DEBUG' if log_level in ['perf', 'debug'] else 'INFO'} compiler_config = {} for key, value in default_config.items(): - if key in devito.configuration: + if key in devito.configuration and key != 'opt': context[key] = value else: compiler_config[key] = value diff --git a/stride/physics/iso_acoustic/devito.py b/stride/physics/iso_acoustic/devito.py index 554e6314..10b480bf 100644 --- a/stride/physics/iso_acoustic/devito.py +++ b/stride/physics/iso_acoustic/devito.py @@ -220,7 +220,7 @@ def subdomains(self): # forward - async def before_forward(self, wavelets, vp, rho=None, alpha=None, **kwargs): + def before_forward(self, wavelets, vp, rho=None, alpha=None, **kwargs): """ Prepare the problem type to run the state or forward problem. @@ -318,6 +318,7 @@ async def before_forward(self, wavelets, vp, rho=None, alpha=None, **kwargs): save_wavefield |= alpha.needs_grad platform = kwargs.get('platform', 'cpu') + stream_wavefield = kwargs.pop('stream_wavefield', True) is_nvidia = platform is not None and 'nvidia' in platform is_nvc = platform is not None and (is_nvidia or 'nvc' in platform) @@ -365,7 +366,10 @@ async def before_forward(self, wavelets, vp, rho=None, alpha=None, **kwargs): # Define the saving of the wavefield if save_wavefield is True: space_order = None if self._needs_grad(rho, alpha) else 0 - layers = devito.HostDevice if is_nvidia else devito.NoLayers + if stream_wavefield: + layers = devito.HostDevice if is_nvidia else devito.NoLayers + else: + layers = devito.Device if is_nvidia else devito.NoLayers p_saved = self.dev_grid.undersampled_time_function('p_saved', time_bounds=time_bounds, factor=self.undersampling_factor, @@ -470,9 +474,6 @@ async def before_forward(self, wavelets, vp, rho=None, alpha=None, **kwargs): # Set geometry and wavelet wavelets = wavelets.data - # if fw3d_mode: - # wavelets[:, 1:] = wavelets[:, :-1] - if diff_source: wavelets = np.gradient(wavelets, self.time.step, axis=-1) @@ -486,7 +487,7 @@ async def before_forward(self, wavelets, vp, rho=None, alpha=None, **kwargs): self.dev_grid.vars.src.coordinates.data[:] = shot.source_coordinates self.dev_grid.vars.rec.coordinates.data[:] = shot.receiver_coordinates - async def run_forward(self, wavelets, vp, rho=None, alpha=None, **kwargs): + def run_forward(self, wavelets, vp, rho=None, alpha=None, **kwargs): """ Run the state or forward problem. @@ -554,7 +555,7 @@ async def run_forward(self, wavelets, vp, rho=None, alpha=None, **kwargs): **functions, **devito_args) - async def after_forward(self, wavelets, vp, rho=None, alpha=None, **kwargs): + def after_forward(self, wavelets, vp, rho=None, alpha=None, **kwargs): """ Clean up after the state run and retrieve the time traces. @@ -660,7 +661,7 @@ def _rm_tmpdir(): # adjoint - async def before_adjoint(self, adjoint_source, wavelets, vp, rho=None, alpha=None, **kwargs): + def before_adjoint(self, adjoint_source, wavelets, vp, rho=None, alpha=None, **kwargs): """ Prepare the problem type to run the adjoint problem. @@ -727,7 +728,7 @@ async def before_adjoint(self, adjoint_source, wavelets, vp, rho=None, alpha=Non src_term = [] # Define gradient - gradient_update = await self.prepare_grad(wavelets, vp, rho, alpha, **kwargs) + gradient_update = self.prepare_grad(wavelets, vp, rho, alpha, **kwargs) # Maybe save wavefield dump_adjoint_wavefield = kwargs.pop('dump_adjoint_wavefield', False) @@ -780,7 +781,7 @@ async def before_adjoint(self, adjoint_source, wavelets, vp, rho=None, alpha=Non self.dev_grid.vars.src.data_with_halo.fill(0.) self.dev_grid.vars.p_a.data_with_halo.fill(0.) self.boundary.clear() - await self.init_grad(wavelets, vp, rho, alpha, **kwargs) + self.init_grad(wavelets, vp, rho, alpha, **kwargs) # Set wavefield if necessary cache_forward = kwargs.pop('cache_forward', False) @@ -827,9 +828,6 @@ async def before_adjoint(self, adjoint_source, wavelets, vp, rho=None, alpha=Non # Set geometry and adjoint source adjoint_source = adjoint_source.data - # if fw3d_mode: - # adjoint_source[:, 1:] = adjoint_source[:, :-1] - window = scipy.signal.get_window(('tukey', 0.001), time_bounds[1]-time_bounds[0], False) window = np.pad(window, ((time_bounds[0], self.time.num-time_bounds[1]),), mode='constant', constant_values=0.) window = window.reshape((self.time.num, 1)) @@ -840,7 +838,7 @@ async def before_adjoint(self, adjoint_source, wavelets, vp, rho=None, alpha=Non self.dev_grid.vars.src.coordinates.data[:] = shot.source_coordinates self.dev_grid.vars.rec.coordinates.data[:] = shot.receiver_coordinates - async def run_adjoint(self, adjoint_source, wavelets, vp, rho=None, alpha=None, **kwargs): + def run_adjoint(self, adjoint_source, wavelets, vp, rho=None, alpha=None, **kwargs): """ Run the adjoint problem. @@ -886,7 +884,7 @@ async def run_adjoint(self, adjoint_source, wavelets, vp, rho=None, alpha=None, **functions, **devito_args) - async def after_adjoint(self, adjoint_source, wavelets, vp, rho=None, alpha=None, **kwargs): + def after_adjoint(self, adjoint_source, wavelets, vp, rho=None, alpha=None, **kwargs): """ Clean up after the adjoint run and retrieve the time gradients (if needed). @@ -922,7 +920,7 @@ async def after_adjoint(self, adjoint_source, wavelets, vp, rho=None, alpha=None if dump_adjoint_wavefield and dump_wavefield_id == shot.id: self.logger.perf('(ShotID %d) Dumping adjoint wavefield' % problem.shot_id) - iteration = kwargs.pop('iteration', None) + iteration = kwargs.get('iteration', None) version = iteration.abs_id+1 if iteration is not None else 0 p_dump_data = np.asarray(self.dev_grid.vars.p_a_dump.data, dtype=np.float32) p_dump = StructuredData(name='adjoint_wavefield-Shot%05d' % shot.id, @@ -945,11 +943,11 @@ async def after_adjoint(self, adjoint_source, wavelets, vp, rho=None, alpha=None self.dev_grid.deallocate('buoy') self.dev_grid.deallocate('alpha', collect=True) - return await self.get_grad(wavelets, vp, rho, alpha, **kwargs) + return self.get_grad(wavelets, vp, rho, alpha, **kwargs) # gradients - async def prepare_grad_vp(self, vp, **kwargs): + def prepare_grad_vp(self, vp, **kwargs): """ Prepare the problem type to calculate the gradients wrt Vp. @@ -990,7 +988,7 @@ async def prepare_grad_vp(self, vp, **kwargs): return p_dt_update + (grad_update, prec_update) - async def init_grad_vp(self, vp, **kwargs): + def init_grad_vp(self, vp, **kwargs): """ Initialise buffers in the problem type to calculate the gradients wrt Vp. @@ -1009,7 +1007,7 @@ async def init_grad_vp(self, vp, **kwargs): prec = self.dev_grid.function('prec_vp') prec.data_with_halo.fill(0.) - async def get_grad_vp(self, vp, **kwargs): + def get_grad_vp(self, vp, **kwargs): """ Retrieve the gradients calculated wrt to the input. @@ -1032,7 +1030,20 @@ async def get_grad_vp(self, vp, **kwargs): variable_prec = self.dev_grid.vars.prec_vp variable_prec = np.asarray(variable_prec.data[self.space.inner], dtype=np.float32) - variable_grad *= -2 / vp.data**3 + is_slowness = False + if vp.transform is not None: + # try to figure out if the user wants slowness by testing the provided transform + try: + is_slowness = 1/vp.transform(10) == 10 + except Exception: + pass + + if is_slowness: + variable_grad *= +1 / vp.data + variable_prec *= (1 / vp.data)**2 + else: + variable_grad *= -2 / vp.data**3 + variable_prec *= (2 / vp.data)**3**2 deallocate = kwargs.pop('deallocate', False) if deallocate: @@ -1066,7 +1077,7 @@ async def get_grad_vp(self, vp, **kwargs): return grad - async def prepare_grad_rho(self, rho, **kwargs): + def prepare_grad_rho(self, rho, **kwargs): """ Prepare the problem type to calculate the gradients wrt rho. @@ -1103,7 +1114,7 @@ async def prepare_grad_rho(self, rho, **kwargs): return grad_term_update + (grad_update, prec_update) - async def init_grad_rho(self, rho, **kwargs): + def init_grad_rho(self, rho, **kwargs): """ Initialise buffers in the problem type to calculate the gradients wrt rho. @@ -1122,7 +1133,7 @@ async def init_grad_rho(self, rho, **kwargs): prec = self.dev_grid.function('prec_rho') prec.data_with_halo.fill(0.) - async def get_grad_rho(self, rho, **kwargs): + def get_grad_rho(self, rho, **kwargs): """ Retrieve the gradients calculated wrt to rho. @@ -1365,8 +1376,14 @@ def _check_conditions(self, wavelets, vp, rho=None, alpha=None, def _stencil(self, field, wavelets, vp, rho=None, alpha=None, direction='forward', save_wavefield=False, **kwargs): + stencils = [] + # Prepare medium functions vp_fun, vp2_fun, inv_vp2_fun, rho_fun, buoy_fun, alpha_fun = self._medium_functions(vp, rho, alpha, **kwargs) + if rho is not None: + rho_constant = np.isclose(np.min(rho.extended_data), np.max(rho.extended_data)) + else: + rho_constant = False # Forward or backward forward = direction == 'forward' @@ -1381,30 +1398,51 @@ def _stencil(self, field, wavelets, vp, rho=None, alpha=None, direction='forward **kwargs) # Get the spatial FD - laplacian = self.dev_grid.function('laplacian', - coefficients='symbolic' if self.drp else 'standard') - laplacian_update = self._laplacian(field, laplacian, vp_fun, vp2_fun, inv_vp2_fun, - rho=rho_fun, buoy=buoy_fun, alpha=alpha_fun, - **kwargs) - if self.kernel == 'OT2': - laplacian_term = self._diff_op(laplacian_update, + # get the subs + if self.drp: + extra_functions = () + subs = self._symbolic_coefficients(field, *extra_functions) + else: + subs = None + + laplacian_term = self._diff_op(field, vp_fun, vp2_fun, inv_vp2_fun, rho=rho_fun, buoy=buoy_fun, alpha=alpha_fun, + rho_constant=rho_constant, **kwargs) else: - laplacian_term = self._diff_op(laplacian, - vp_fun, vp2_fun, inv_vp2_fun, - rho=rho_fun, buoy=buoy_fun, alpha=alpha_fun, - **kwargs) + laplacian_2 = self.dev_grid.function('laplacian', + coefficients='symbolic' if self.drp else 'standard') - # Get the subs - if self.drp: - extra_functions = () - subs = self._symbolic_coefficients(field, laplacian, - *extra_functions) - else: - subs = None + # get the subs + if self.drp: + extra_functions = () + subs = self._symbolic_coefficients(field, laplacian_2, *extra_functions) + else: + subs = None + + # first laplacian application - L2 + laplacian_term_2 = self._diff_op(field, + vp_fun, vp2_fun, inv_vp2_fun, + rho=rho_fun, buoy=buoy_fun, alpha=alpha_fun, + rho_constant=rho_constant, + **kwargs) + + stencil_laplacian = devito.Eq(laplacian_2, laplacian_term_2, + subdomain=abox, + coefficients=subs) + stencils.append(stencil_laplacian) + + # second laplacian application - L4 + laplacian_term_4 = self._diff_op(laplacian_2, + vp_fun, vp2_fun, inv_vp2_fun, + rho=rho_fun, buoy=buoy_fun, alpha=alpha_fun, + rho_constant=rho_constant, + **kwargs) + + # final term + laplacian_term = self._laplacian(laplacian_2, laplacian_term_4) # Get the attenuation term if alpha_fun is not None and self.attenuation_power is not None: @@ -1421,7 +1459,7 @@ def _stencil(self, field, wavelets, vp, rho=None, alpha=None, direction='forward attenuation_term = 0 # Set up the boundary - boundary_field = laplacian if self.kernel != 'OT2' and 'PML' in self.boundary_type else field + boundary_field = laplacian_2 if self.kernel != 'OT2' and 'PML' in self.boundary_type else field boundary_term, eq_before, eq_after = self.boundary.apply(boundary_field, vp.extended_data, velocity_fun=vp_fun, direction=direction, subs=subs, @@ -1454,14 +1492,6 @@ def _stencil(self, field, wavelets, vp, rho=None, alpha=None, direction='forward - vp2_fun*sub_exprs, u_next) # Time-stepping stencil - stencils = [] - - if self.kernel != 'OT2': - stencil_laplacian = devito.Eq(laplacian, laplacian_update, - subdomain=abox, - coefficients=subs) - stencils.append(stencil_laplacian) - if 'hybrid' in self.boundary_type: domain = abox else: @@ -1510,7 +1540,7 @@ def _medium_functions(self, vp, rho=None, alpha=None, **kwargs): return vp_fun, vp2_fun, inv_vp2_fun, rho_fun, buoy_fun, alpha_fun - def _laplacian(self, field, laplacian, vp, vp2, inv_vp2, **kwargs): + def _laplacian(self, laplacian_2, laplacian_4, **kwargs): if self.kernel not in ['OT2', 'OT4']: raise ValueError("Unrecognized kernel") @@ -1518,22 +1548,33 @@ def _laplacian(self, field, laplacian, vp, vp2, inv_vp2, **kwargs): bi_harmonic = 0 else: - bi_harmonic = self.time.step**2/12 * self._diff_op(field, - vp, vp2, inv_vp2, - **kwargs) + bi_harmonic = self.time.step**2/12 * laplacian_4 - laplacian_update = field + bi_harmonic + laplacian_update = laplacian_2 + bi_harmonic return laplacian_update def _diff_op(self, field, vp, vp2, inv_vp2, **kwargs): rho = kwargs.pop('rho', None) buoy = kwargs.pop('buoy', None) + rho_constant = kwargs.pop('rho_constant', False) if buoy is None: return vp2 * field.laplace else: - return vp2 * rho * devito.div(buoy * devito.grad(field, shift=+0.5), shift=-0.5) + if rho_constant: + return vp2 * self._div_op(self._grad_op(field, shift=+1), shift=-1) + else: + return vp2 * rho * self._div_op(self._mul_buoy(buoy, self._grad_op(field, shift=+1)), shift=-1) + + def _grad_op(self, f, shift=+1): + return devito.grad(f, shift=shift * 0.5) + + def _div_op(self, fs, shift=-1): + return devito.div(fs, shift=shift * 0.5) + + def _mul_buoy(self, buoy, fs): + return buoy * fs def _subdomains(self, *args, **kwargs): problem = kwargs.get('problem') diff --git a/stride/physics/iso_elastic/devito.py b/stride/physics/iso_elastic/devito.py index bf8c8f03..157a5af9 100644 --- a/stride/physics/iso_elastic/devito.py +++ b/stride/physics/iso_elastic/devito.py @@ -81,7 +81,7 @@ def clear_operators(self): # forward - async def before_forward(self, wavelets, vp, vs, rho, **kwargs): + def before_forward(self, wavelets, vp, vs, rho, **kwargs): """ Prepare the problem type to run the state or forward problem. @@ -204,7 +204,7 @@ async def before_forward(self, wavelets, vp, vs, rho, **kwargs): self.dev_grid.vars.src.coordinates.data[:] = shot.source_coordinates self.dev_grid.vars.rec_tau.coordinates.data[:] = shot.receiver_coordinates - async def run_forward(self, wavelets, vp, vs, rho, **kwargs): + def run_forward(self, wavelets, vp, vs, rho, **kwargs): """ Run the state or forward problem. @@ -234,7 +234,7 @@ async def run_forward(self, wavelets, vp, vs, rho, **kwargs): **functions, **kwargs.pop('devito_args', {})) - async def after_forward(self, wavelets, vp, vs, rho, **kwargs): + def after_forward(self, wavelets, vp, vs, rho, **kwargs): """ Clean up after the state run and retrieve the time traces. @@ -277,19 +277,19 @@ async def after_forward(self, wavelets, vp, vs, rho, **kwargs): # adjoint - async def before_adjoint(self, adjoint_source, wavelets, vp, rho=None, alpha=None, **kwargs): + def before_adjoint(self, adjoint_source, wavelets, vp, rho=None, alpha=None, **kwargs): """ Not implemented """ pass - async def run_adjoint(self, adjoint_source, wavelets, vp, rho=None, alpha=None, **kwargs): + def run_adjoint(self, adjoint_source, wavelets, vp, rho=None, alpha=None, **kwargs): """ Not implemented """ pass - async def after_adjoint(self, **kwargs): + def after_adjoint(self, **kwargs): """ Not implemented """ @@ -297,19 +297,19 @@ async def after_adjoint(self, **kwargs): # gradients - async def prepare_grad_vp(self, **kwargs): + def prepare_grad_vp(self, **kwargs): """ Not implemented """ pass - async def init_grad_vp(self, **kwargs): + def init_grad_vp(self, **kwargs): """ Not implemented """ pass - async def get_grad_vp(self, **kwargs): + def get_grad_vp(self, **kwargs): """ Not implemented """ diff --git a/stride/physics/marmottant/devito.py b/stride/physics/marmottant/devito.py index 4eb19556..bbd61b7b 100644 --- a/stride/physics/marmottant/devito.py +++ b/stride/physics/marmottant/devito.py @@ -101,7 +101,7 @@ def clear_operators(self): # forward - async def before_forward(self, r_0, x_0=None, + def before_forward(self, r_0, x_0=None, vp=1540., rho=997, sigma=0.073, mu=0.002, p_0=101325, p=0., kappa=1.07, kappa_s=5E-9, chi=0.4, r_buckle=None, r_break=None, **kwargs): @@ -159,7 +159,7 @@ async def before_forward(self, r_0, x_0=None, self.state_operator.set_operator(init_terms + stencil, **kwargs) self.state_operator.compile() - async def run_forward(self, *args, **kwargs): + def run_forward(self, *args, **kwargs): """ Run the state or forward problem. @@ -178,7 +178,7 @@ async def run_forward(self, *args, **kwargs): **functions, **kwargs.pop('devito_args', {})) - async def after_forward(self, *args, **kwargs): + def after_forward(self, *args, **kwargs): """ Clean up after the state run and retrieve the time traces. diff --git a/stride/physics/problem_type.py b/stride/physics/problem_type.py index 26ffed4d..92cd7bfe 100644 --- a/stride/physics/problem_type.py +++ b/stride/physics/problem_type.py @@ -1,4 +1,3 @@ - from abc import ABC import mosaic @@ -6,7 +5,6 @@ from ..core import Operator from ..problem.base import Gridded - __all__ = ['ProblemTypeBase'] @@ -56,7 +54,7 @@ def __init__(self, **kwargs): Gridded.__init__(self, **kwargs) Operator.__init__(self, **kwargs) - async def forward(self, *args, **kwargs): + def forward(self, *args, **kwargs): """ Run the state or forward problem. @@ -73,18 +71,18 @@ async def forward(self, *args, **kwargs): pre_str = '(ShotID %d) ' % problem.shot_id self.logger.perf('%sPreparing to run state for shot' % pre_str) - await self.before_forward(*args, **kwargs) + self.before_forward(*args, **kwargs) self.logger.perf('%sRunning state equation for shot' % pre_str) - await self.run_forward(*args, **kwargs) + self.run_forward(*args, **kwargs) self.logger.perf('%sCompleting state equation run for shot' % pre_str) - output = await self.after_forward(*args, **kwargs) + output = self.after_forward(*args, **kwargs) self.logger.perf('%sCompleted state equation run for shot' % pre_str) return output - async def adjoint(self, *args, **kwargs): + def adjoint(self, *args, **kwargs): """ Run the adjoint problem. @@ -101,18 +99,18 @@ async def adjoint(self, *args, **kwargs): pre_str = '(ShotID %d) ' % problem.shot_id self.logger.perf('%sPreparing to run adjoint for shot' % pre_str) - await self.before_adjoint(*args, **kwargs) + self.before_adjoint(*args, **kwargs) self.logger.perf('%sRunning adjoint equation for shot' % pre_str) - await self.run_adjoint(*args, **kwargs) + self.run_adjoint(*args, **kwargs) self.logger.perf('%sCompleting adjoint equation run for shot' % pre_str) - output = await self.after_adjoint(*args, **kwargs) + output = self.after_adjoint(*args, **kwargs) self.logger.perf('%sCompleted adjoint equation run for shot' % pre_str) return output - async def before_forward(self, *args, **kwargs): + def before_forward(self, *args, **kwargs): """ Prepare the problem type to run the state or forward problem. @@ -126,7 +124,7 @@ async def before_forward(self, *args, **kwargs): raise NotImplementedError('before_forward has not been implemented ' 'for objects of type %s' % self.__class__.__name__) - async def run_forward(self, *args, **kwargs): + def run_forward(self, *args, **kwargs): """ Run the state or forward problem. @@ -140,7 +138,7 @@ async def run_forward(self, *args, **kwargs): raise NotImplementedError('run_forward has not been implemented ' 'for objects of type %s' % self.__class__.__name__) - async def after_forward(self, *args, **kwargs): + def after_forward(self, *args, **kwargs): """ Clean up after the state run and retrieve the outputs. @@ -156,7 +154,7 @@ async def after_forward(self, *args, **kwargs): raise NotImplementedError('after_forward has not been implemented ' 'for objects of type %s' % self.__class__.__name__) - async def before_adjoint(self, *args, **kwargs): + def before_adjoint(self, *args, **kwargs): """ Prepare the problem type to run the adjoint problem. @@ -170,7 +168,7 @@ async def before_adjoint(self, *args, **kwargs): raise NotImplementedError('before_adjoint has not been implemented ' 'for objects of type %s' % self.__class__.__name__) - async def run_adjoint(self, *args, **kwargs): + def run_adjoint(self, *args, **kwargs): """ Run the adjoint problem. @@ -184,7 +182,7 @@ async def run_adjoint(self, *args, **kwargs): raise NotImplementedError('run_adjoint has not been implemented ' 'for objects of type %s' % self.__class__.__name__) - async def after_adjoint(self, *args, **kwargs): + def after_adjoint(self, *args, **kwargs): """ Clean up after the adjoint run and retrieve the gradients (if needed). @@ -200,7 +198,7 @@ async def after_adjoint(self, *args, **kwargs): raise NotImplementedError('after_adjoint has not been implemented ' 'for objects of type %s' % self.__class__.__name__) - async def prepare_grad(self, *wrt, **kwargs): + def prepare_grad(self, *wrt, **kwargs): """ Prepare the problem type to calculate the gradients wrt the inputs. @@ -229,7 +227,7 @@ async def prepare_grad(self, *wrt, **kwargs): if method is None: raise ValueError('Variable %s not implemented' % variable.name) - update = await method(variable, wrt=wrt, **kwargs) + update = method(variable, wrt=wrt, **kwargs) if not isinstance(update, tuple): update = (update,) @@ -238,7 +236,7 @@ async def prepare_grad(self, *wrt, **kwargs): return gradient_update - async def init_grad(self, *wrt, **kwargs): + def init_grad(self, *wrt, **kwargs): """ Initialise buffers in the problem type to calculate the gradients wrt the inputs. @@ -263,9 +261,9 @@ async def init_grad(self, *wrt, **kwargs): if method is None: raise ValueError('Variable %s not implemented' % variable.name) - await method(variable, wrt=wrt, **kwargs) + method(variable, wrt=wrt, **kwargs) - async def get_grad(self, *wrt, **kwargs): + def get_grad(self, *wrt, **kwargs): """ Retrieve the gradients calculated wrt to the inputs. @@ -294,6 +292,6 @@ async def get_grad(self, *wrt, **kwargs): if method is None: raise ValueError('Variable %s not implemented' % variable.name) - grads.append(await method(variable, wrt=wrt, **kwargs)) + grads.append(method(variable, wrt=wrt, **kwargs)) return tuple(grads) diff --git a/stride/problem/data.py b/stride/problem/data.py index 0b5d9ea0..3e024ad4 100644 --- a/stride/problem/data.py +++ b/stride/problem/data.py @@ -120,6 +120,10 @@ class StructuredData(Data): """ def __init__(self, **kwargs): + # hacky, but does the trick for now + name = kwargs.get('name', None) + if name is not None and 'vp' in name: + kwargs['transform'] = kwargs.pop('transform', lambda x: 1 / x) super().__init__(**kwargs) shape = kwargs.pop('shape', None) @@ -365,7 +369,7 @@ def process_grad(self, global_prec=True, **kwargs): self.grad.apply_prec(**kwargs) return self.grad - def apply_prec(self, prec_scale=4.0, prec_smooth=1.0, prec_op=None, prec=None, **kwargs): + def apply_prec(self, prec_scale=4.0, prec_smooth=None, prec_op=None, prec=None, **kwargs): """ Apply a pre-conditioner to the current field. @@ -400,8 +404,7 @@ def apply_prec(self, prec_scale=4.0, prec_smooth=1.0, prec_op=None, prec=None, * prec.data[:] = prec_op(prec.data) non_zero = np.abs(prec.data) > 0. - prec.data[non_zero] = 1/prec.data[non_zero] - self.data[non_zero] *= prec.data[non_zero] + self.data[non_zero] *= 1/prec.data[non_zero] return self @@ -593,6 +596,15 @@ def __truediv__(self, other): return res + def __rtruediv__(self, other): + res, other_data = self._prepare_op(other) + res.extended_data[:] = res.extended_data.__rtruediv__(other_data) + + self._op_grad(res, other, '__rtruediv__') + self._op_prec(res, other, '__rtruediv__') + + return res + def __floordiv__(self, other): res, other_data = self._prepare_op(other) res.extended_data[:] = res.extended_data.__floordiv__(other_data) @@ -602,6 +614,15 @@ def __floordiv__(self, other): return res + def __rfloordiv__(self, other): + res, other_data = self._prepare_op(other) + res.extended_data[:] = res.extended_data.__rfloordiv__(other_data) + + self._op_grad(res, other, '__rfloordiv__') + self._op_prec(res, other, '__rfloordiv__') + + return res + def __iadd__(self, other): res = self other_data = self._prepare_other(other) @@ -661,8 +682,6 @@ def __ifloordiv__(self, other): __radd__ = __add__ __rsub__ = __sub__ __rmul__ = __mul__ - __rtruediv__ = __truediv__ - __rfloordiv__ = __floordiv__ def __get_desc__(self, **kwargs): if self._data is None: