[cig-commits] [commit] devel,master: bug fix for gpu simulations with stacey absorbing boundaries; updates gpu kernel headers (95124e5)

cig_noreply at geodynamics.org cig_noreply at geodynamics.org
Thu Nov 6 08:28:45 PST 2014


Repository : https://github.com/geodynamics/specfem3d_globe

On branches: devel,master
Link       : https://github.com/geodynamics/specfem3d_globe/compare/bc58e579b3b0838a0968725a076f5904845437ca...be63f20cbb6f462104e949894dbe205d2398cd7f

>---------------------------------------------------------------

commit 95124e51f6153ddf1cc2132f6212ae010ac11dd0
Author: daniel peter <peterda at ethz.ch>
Date:   Fri Aug 15 12:48:48 2014 +0200

    bug fix for gpu simulations with stacey absorbing boundaries; updates gpu kernel headers


>---------------------------------------------------------------

95124e51f6153ddf1cc2132f6212ae010ac11dd0
 src/gpu/assemble_MPI_scalar_gpu.c                  | 116 +++---
 src/gpu/assemble_MPI_vector_gpu.c                  | 157 ++++----
 src/gpu/boast/HEADER.rb                            |   1 +
 src/gpu/boast/compute_stacey_acoustic_kernel.rb    | 111 +++---
 src/gpu/boast/compute_stacey_elastic_kernel.rb     | 127 +++----
 src/gpu/boast/kernels.rb                           |  11 +-
 .../boast/references/get_maximum_scalar_kernel.cu  |   4 +-
 src/gpu/check_fields_gpu.c                         | 153 +++++---
 src/gpu/compute_add_sources_elastic_gpu.c          |  11 +-
 src/gpu/compute_coupling_gpu.c                     | 103 ++---
 src/gpu/compute_forces_crust_mantle_gpu.c          |  28 +-
 src/gpu/compute_forces_inner_core_gpu.c            |  27 +-
 src/gpu/compute_forces_outer_core_gpu.c            |  29 +-
 src/gpu/compute_kernels_gpu.c                      |  27 +-
 src/gpu/compute_stacey_acoustic_gpu.c              |  49 ++-
 src/gpu/compute_stacey_elastic_gpu.c               |  26 +-
 src/gpu/initialize_gpu.c                           | 417 ++++++++++++++-------
 .../assemble_boundary_accel_on_device.cu           |   1 +
 .../assemble_boundary_accel_on_device_cl.c         |   1 +
 .../assemble_boundary_potential_on_device.cu       |   1 +
 .../assemble_boundary_potential_on_device_cl.c     |   1 +
 src/gpu/kernels.gen/compute_acoustic_kernel.cu     |   1 +
 src/gpu/kernels.gen/compute_acoustic_kernel_cl.c   |   3 +-
 .../compute_add_sources_adjoint_kernel.cu          |   1 +
 .../compute_add_sources_adjoint_kernel_cl.c        |   1 +
 src/gpu/kernels.gen/compute_add_sources_kernel.cu  |   1 +
 .../kernels.gen/compute_add_sources_kernel_cl.c    |   1 +
 src/gpu/kernels.gen/compute_ani_kernel.cu          |   1 +
 src/gpu/kernels.gen/compute_ani_kernel_cl.c        |   3 +-
 src/gpu/kernels.gen/compute_ani_undo_att_kernel.cu |   1 +
 .../kernels.gen/compute_ani_undo_att_kernel_cl.c   |   5 +-
 .../compute_coupling_CMB_fluid_kernel.cu           |   1 +
 .../compute_coupling_CMB_fluid_kernel_cl.c         |   1 +
 .../compute_coupling_ICB_fluid_kernel.cu           |   1 +
 .../compute_coupling_ICB_fluid_kernel_cl.c         |   1 +
 .../compute_coupling_fluid_CMB_kernel.cu           |   1 +
 .../compute_coupling_fluid_CMB_kernel_cl.c         |   1 +
 .../compute_coupling_fluid_ICB_kernel.cu           |   1 +
 .../compute_coupling_fluid_ICB_kernel_cl.c         |   1 +
 .../kernels.gen/compute_coupling_ocean_kernel.cu   |   1 +
 .../kernels.gen/compute_coupling_ocean_kernel_cl.c |   1 +
 src/gpu/kernels.gen/compute_hess_kernel.cu         |   1 +
 src/gpu/kernels.gen/compute_hess_kernel_cl.c       |   1 +
 src/gpu/kernels.gen/compute_iso_kernel.cu          |   1 +
 src/gpu/kernels.gen/compute_iso_kernel_cl.c        |   1 +
 src/gpu/kernels.gen/compute_iso_undo_att_kernel.cu |   1 +
 .../kernels.gen/compute_iso_undo_att_kernel_cl.c   |   3 +-
 src/gpu/kernels.gen/compute_rho_kernel.cu          |   1 +
 src/gpu/kernels.gen/compute_rho_kernel_cl.c        |   1 +
 .../compute_stacey_acoustic_backward_kernel.cu     |   5 +-
 .../compute_stacey_acoustic_backward_kernel_cl.c   |   5 +-
 .../kernels.gen/compute_stacey_acoustic_kernel.cu  |  15 +-
 .../compute_stacey_acoustic_kernel_cl.c            |  15 +-
 .../compute_stacey_elastic_backward_kernel.cu      |   9 +-
 .../compute_stacey_elastic_backward_kernel_cl.c    |   9 +-
 .../kernels.gen/compute_stacey_elastic_kernel.cu   |  45 +--
 .../kernels.gen/compute_stacey_elastic_kernel_cl.c |  45 +--
 .../kernels.gen/compute_strength_noise_kernel.cu   |   1 +
 .../kernels.gen/compute_strength_noise_kernel_cl.c |   1 +
 .../crust_mantle_impl_kernel_adjoint.cu            |   1 +
 .../crust_mantle_impl_kernel_adjoint_cl.c          |  13 +-
 .../crust_mantle_impl_kernel_forward.cu            |   1 +
 .../crust_mantle_impl_kernel_forward_cl.c          |  13 +-
 src/gpu/kernels.gen/get_maximum_scalar_kernel.cu   |   1 +
 src/gpu/kernels.gen/get_maximum_scalar_kernel_cl.c |   1 +
 src/gpu/kernels.gen/get_maximum_vector_kernel.cu   |   1 +
 src/gpu/kernels.gen/get_maximum_vector_kernel_cl.c |   1 +
 .../kernels.gen/inner_core_impl_kernel_adjoint.cu  |   1 +
 .../inner_core_impl_kernel_adjoint_cl.c            |   7 +-
 .../kernels.gen/inner_core_impl_kernel_forward.cu  |   1 +
 .../inner_core_impl_kernel_forward_cl.c            |   7 +-
 .../noise_add_source_master_rec_kernel.cu          |   1 +
 .../noise_add_source_master_rec_kernel_cl.c        |   1 +
 .../kernels.gen/noise_add_surface_movie_kernel.cu  |   1 +
 .../noise_add_surface_movie_kernel_cl.c            |   1 +
 .../noise_transfer_surface_to_host_kernel.cu       |   1 +
 .../noise_transfer_surface_to_host_kernel_cl.c     |   1 +
 .../kernels.gen/outer_core_impl_kernel_adjoint.cu  |   1 +
 .../outer_core_impl_kernel_adjoint_cl.c            |   3 +-
 .../kernels.gen/outer_core_impl_kernel_forward.cu  |   1 +
 .../outer_core_impl_kernel_forward_cl.c            |   3 +-
 .../prepare_boundary_accel_on_device.cu            |   1 +
 .../prepare_boundary_accel_on_device_cl.c          |   1 +
 .../prepare_boundary_potential_on_device.cu        |   1 +
 .../prepare_boundary_potential_on_device_cl.c      |   1 +
 .../kernels.gen/update_accel_acoustic_kernel.cu    |   1 +
 .../kernels.gen/update_accel_acoustic_kernel_cl.c  |   1 +
 src/gpu/kernels.gen/update_accel_elastic_kernel.cu |   1 +
 .../kernels.gen/update_accel_elastic_kernel_cl.c   |   1 +
 src/gpu/kernels.gen/update_disp_veloc_kernel.cu    |   1 +
 src/gpu/kernels.gen/update_disp_veloc_kernel_cl.c  |   1 +
 src/gpu/kernels.gen/update_potential_kernel.cu     |   1 +
 src/gpu/kernels.gen/update_potential_kernel_cl.c   |   1 +
 .../kernels.gen/update_veloc_acoustic_kernel.cu    |   1 +
 .../kernels.gen/update_veloc_acoustic_kernel_cl.c  |   1 +
 src/gpu/kernels.gen/update_veloc_elastic_kernel.cu |   1 +
 .../kernels.gen/update_veloc_elastic_kernel_cl.c   |   1 +
 ...rite_seismograms_transfer_from_device_kernel.cu |   1 +
 ...te_seismograms_transfer_from_device_kernel_cl.c |   1 +
 ...ismograms_transfer_strain_from_device_kernel.cu |   1 +
 ...mograms_transfer_strain_from_device_kernel_cl.c |   1 +
 src/gpu/mesh_constants_cuda.h                      |  12 +-
 src/gpu/mesh_constants_gpu.h                       |  15 +-
 src/gpu/mesh_constants_ocl.h                       |  23 +-
 src/gpu/noise_tomography_gpu.c                     |  27 +-
 src/gpu/prepare_mesh_constants_gpu.c               | 417 +++++++++------------
 src/gpu/rules.mk                                   |  24 +-
 src/gpu/save_and_compare_cpu_vs_gpu.c              |   6 +-
 src/gpu/transfer_fields_gpu.c                      |  80 ++--
 src/gpu/update_displacement_gpu.c                  | 166 +++++---
 src/gpu/write_seismograms_gpu.c                    |  15 +-
 src/meshfem3D/create_regions_mesh_adios.f90        |   0
 src/meshfem3D/model_gll_adios.F90                  |   0
 src/shared/adios_helpers_writers.f90               |   0
 src/shared/asdf_helpers.f90                        |   2 +-
 src/shared/asdf_helpers_definitions.f90            |   2 +-
 src/shared/asdf_helpers_writers.f90                |   2 +-
 src/specfem3D/initialize_simulation.f90            |   3 +
 src/specfem3D/prepare_timerun.f90                  |  43 +--
 src/specfem3D/write_output_ASDF.F90                |   0
 .../gpuTrace/instr-ocl.c                           |   5 +-
 121 files changed, 1505 insertions(+), 1008 deletions(-)

Diff suppressed because of size. To see it, use:

    git diff-tree --root --patch-with-stat --no-color --find-copies-harder --ignore-space-at-eol --cc 95124e51f6153ddf1cc2132f6212ae010ac11dd0


More information about the CIG-COMMITS mailing list