![]() |
Octopus
|
Data Types | |
type | accel_context_t |
interface | accel_create_blas_alpha_beta_buffer |
interface | accel_create_buffer |
type | accel_device_t |
interface | accel_get_device_pointer |
interface | accel_kernel_run |
type | accel_kernel_t |
type | accel_mem_t |
interface | accel_padded_size |
interface | accel_read_buffer |
interface | accel_release_blas_alpha_beta_buffer |
interface | accel_set_buffer_to_zero |
interface | accel_set_kernel_arg |
type | accel_t |
interface | accel_write_buffer |
Functions/Subroutines | |
pure logical function, public | accel_is_enabled () |
pure logical function, public | accel_allow_cpu_only () |
subroutine, public | accel_init (base_grp, namespace) |
subroutine, public | accel_end (namespace) |
integer(int64) function | accel_padded_size_i8 (nn) |
integer(int32) function | accel_padded_size_i4 (nn) |
subroutine | accel_create_buffer_4 (this, flags, type, size, set_zero, async) |
subroutine | accel_create_buffer_8 (this, flags, type, size, set_zero, async) |
subroutine, public | accel_release_buffer (this, async) |
subroutine, public | accel_ensure_buffer_size (buffer, flags, type, required_size, set_zero, async) |
logical pure function, public | accel_buffer_is_allocated (this) |
subroutine, public | accel_finish () |
subroutine | accel_set_kernel_arg_buffer (kernel, narg, buffer) |
subroutine | accel_set_kernel_arg_local (kernel, narg, type, size) |
subroutine | accel_kernel_run_8 (kernel, globalsizes, localsizes) |
subroutine | accel_kernel_run_4 (kernel, globalsizes, localsizes) |
integer pure function, public | accel_max_workgroup_size () |
integer function, public | accel_kernel_workgroup_size (kernel) |
subroutine, public | clblas_print_error (ierr, name) |
subroutine, public | clfft_print_error (ierr, name) |
subroutine | accel_set_buffer_to (buffer, type, val, nval, offset, async) |
subroutine | accel_set_buffer_to_zero_i8 (buffer, type, nval, offset, async) |
subroutine | accel_set_buffer_to_zero_i4 (buffer, type, nval, offset, async) |
subroutine | opencl_check_bandwidth () |
logical pure function, public | accel_use_shared_mem () |
subroutine | accel_kernel_global_init () |
subroutine | accel_kernel_global_end () |
subroutine, public | accel_kernel_build (this, file_name, kernel_name, flags) |
subroutine | accel_kernel_end (this) |
subroutine, public | accel_kernel_start_call (this, file_name, kernel_name, flags) |
integer(int64) pure function, public | accel_global_memory_size () |
integer(int64) pure function, public | accel_local_memory_size () |
integer pure function, public | accel_max_size_per_dim (dim) |
subroutine, public | accel_set_stream (stream_number) |
subroutine, public | accel_get_stream (stream_number) |
subroutine, public | accel_synchronize_all_streams () |
type(c_ptr) function, public | daccel_get_pointer_with_offset (buffer, offset) |
type(c_ptr) function, public | zaccel_get_pointer_with_offset (buffer, offset) |
subroutine, public | accel_clean_pointer (buffer) |
subroutine, public | accel_get_unfolded_size (size, grid_size, thread_block_size) |
Get unfolded size: some kernels (e.g. projectors) unfold the array across warps as an optimization. This is, however, only beneficial on Nvidia GPUs. More... | |
subroutine | daccel_write_buffer_single (this, data, async) |
subroutine | daccel_write_buffer_0 (this, n1, data, offset, async) |
subroutine | daccel_write_buffer_1 (this, n1, data, offset, async) |
subroutine | daccel_write_buffer_2 (this, n1, n2, data, offset, async) |
subroutine | daccel_write_buffer_3 (this, n1, n2, n3, data, offset, async) |
subroutine | daccel_write_buffer_0_int32 (this, n1, data, offset, async) |
subroutine | daccel_write_buffer_1_int32 (this, n1, data, offset, async) |
subroutine | daccel_write_buffer_2_int32 (this, n1, n2, data, offset, async) |
subroutine | daccel_write_buffer_3_int32 (this, n1, n2, n3, data, offset, async) |
subroutine | daccel_read_buffer_0 (this, n1, data, offset, async) |
subroutine | daccel_read_buffer_1 (this, n1, data, offset, async) |
subroutine | daccel_read_buffer_2 (this, n1, n2, data, offset, async) |
subroutine | daccel_read_buffer_3 (this, n1, n2, n3, data, offset, async) |
subroutine | daccel_read_buffer_0_int32 (this, n1, data, offset, async) |
subroutine | daccel_read_buffer_1_int32 (this, n1, data, offset, async) |
subroutine | daccel_read_buffer_2_int32 (this, n1, n2, data, offset, async) |
subroutine | daccel_read_buffer_3_int32 (this, n1, n2, n3, data, offset, async) |
subroutine | daccel_set_kernel_arg_data (kernel, narg, data) |
subroutine | daccel_get_device_pointer_1 (host_pointer, device_pointer, dimensions) |
subroutine | daccel_get_device_pointer_2 (host_pointer, device_pointer, dimensions) |
subroutine | daccel_get_device_pointer_3 (host_pointer, device_pointer, dimensions) |
subroutine | daccel_get_device_pointer_1l (host_pointer, device_pointer, dimensions) |
subroutine | daccel_get_device_pointer_2l (host_pointer, device_pointer, dimensions) |
subroutine | daccel_get_device_pointer_3l (host_pointer, device_pointer, dimensions) |
subroutine | daccel_create_blas_alpha_beta_buffer (this, data, async) |
subroutine | daccel_release_blas_alpha_beta_buffer (this, data, async) |
subroutine | zaccel_write_buffer_single (this, data, async) |
subroutine | zaccel_write_buffer_0 (this, n1, data, offset, async) |
subroutine | zaccel_write_buffer_1 (this, n1, data, offset, async) |
subroutine | zaccel_write_buffer_2 (this, n1, n2, data, offset, async) |
subroutine | zaccel_write_buffer_3 (this, n1, n2, n3, data, offset, async) |
subroutine | zaccel_write_buffer_0_int32 (this, n1, data, offset, async) |
subroutine | zaccel_write_buffer_1_int32 (this, n1, data, offset, async) |
subroutine | zaccel_write_buffer_2_int32 (this, n1, n2, data, offset, async) |
subroutine | zaccel_write_buffer_3_int32 (this, n1, n2, n3, data, offset, async) |
subroutine | zaccel_read_buffer_0 (this, n1, data, offset, async) |
subroutine | zaccel_read_buffer_1 (this, n1, data, offset, async) |
subroutine | zaccel_read_buffer_2 (this, n1, n2, data, offset, async) |
subroutine | zaccel_read_buffer_3 (this, n1, n2, n3, data, offset, async) |
subroutine | zaccel_read_buffer_0_int32 (this, n1, data, offset, async) |
subroutine | zaccel_read_buffer_1_int32 (this, n1, data, offset, async) |
subroutine | zaccel_read_buffer_2_int32 (this, n1, n2, data, offset, async) |
subroutine | zaccel_read_buffer_3_int32 (this, n1, n2, n3, data, offset, async) |
subroutine | zaccel_set_kernel_arg_data (kernel, narg, data) |
subroutine | zaccel_get_device_pointer_1 (host_pointer, device_pointer, dimensions) |
subroutine | zaccel_get_device_pointer_2 (host_pointer, device_pointer, dimensions) |
subroutine | zaccel_get_device_pointer_3 (host_pointer, device_pointer, dimensions) |
subroutine | zaccel_get_device_pointer_1l (host_pointer, device_pointer, dimensions) |
subroutine | zaccel_get_device_pointer_2l (host_pointer, device_pointer, dimensions) |
subroutine | zaccel_get_device_pointer_3l (host_pointer, device_pointer, dimensions) |
subroutine | zaccel_create_blas_alpha_beta_buffer (this, data, async) |
subroutine | zaccel_release_blas_alpha_beta_buffer (this, data, async) |
subroutine | iaccel_write_buffer_single (this, data, async) |
subroutine | iaccel_write_buffer_0 (this, n1, data, offset, async) |
subroutine | iaccel_write_buffer_1 (this, n1, data, offset, async) |
subroutine | iaccel_write_buffer_2 (this, n1, n2, data, offset, async) |
subroutine | iaccel_write_buffer_3 (this, n1, n2, n3, data, offset, async) |
subroutine | iaccel_write_buffer_0_int32 (this, n1, data, offset, async) |
subroutine | iaccel_write_buffer_1_int32 (this, n1, data, offset, async) |
subroutine | iaccel_write_buffer_2_int32 (this, n1, n2, data, offset, async) |
subroutine | iaccel_write_buffer_3_int32 (this, n1, n2, n3, data, offset, async) |
subroutine | iaccel_read_buffer_0 (this, n1, data, offset, async) |
subroutine | iaccel_read_buffer_1 (this, n1, data, offset, async) |
subroutine | iaccel_read_buffer_2 (this, n1, n2, data, offset, async) |
subroutine | iaccel_read_buffer_3 (this, n1, n2, n3, data, offset, async) |
subroutine | iaccel_read_buffer_0_int32 (this, n1, data, offset, async) |
subroutine | iaccel_read_buffer_1_int32 (this, n1, data, offset, async) |
subroutine | iaccel_read_buffer_2_int32 (this, n1, n2, data, offset, async) |
subroutine | iaccel_read_buffer_3_int32 (this, n1, n2, n3, data, offset, async) |
subroutine | iaccel_set_kernel_arg_data (kernel, narg, data) |
subroutine | iaccel_get_device_pointer_1 (host_pointer, device_pointer, dimensions) |
subroutine | iaccel_get_device_pointer_2 (host_pointer, device_pointer, dimensions) |
subroutine | iaccel_get_device_pointer_3 (host_pointer, device_pointer, dimensions) |
subroutine | iaccel_get_device_pointer_1l (host_pointer, device_pointer, dimensions) |
subroutine | iaccel_get_device_pointer_2l (host_pointer, device_pointer, dimensions) |
subroutine | iaccel_get_device_pointer_3l (host_pointer, device_pointer, dimensions) |
subroutine | iaccel_create_blas_alpha_beta_buffer (this, data, async) |
subroutine | iaccel_release_blas_alpha_beta_buffer (this, data, async) |
subroutine | laccel_write_buffer_single (this, data, async) |
subroutine | laccel_write_buffer_0 (this, n1, data, offset, async) |
subroutine | laccel_write_buffer_1 (this, n1, data, offset, async) |
subroutine | laccel_write_buffer_2 (this, n1, n2, data, offset, async) |
subroutine | laccel_write_buffer_3 (this, n1, n2, n3, data, offset, async) |
subroutine | laccel_write_buffer_0_int32 (this, n1, data, offset, async) |
subroutine | laccel_write_buffer_1_int32 (this, n1, data, offset, async) |
subroutine | laccel_write_buffer_2_int32 (this, n1, n2, data, offset, async) |
subroutine | laccel_write_buffer_3_int32 (this, n1, n2, n3, data, offset, async) |
subroutine | laccel_read_buffer_0 (this, n1, data, offset, async) |
subroutine | laccel_read_buffer_1 (this, n1, data, offset, async) |
subroutine | laccel_read_buffer_2 (this, n1, n2, data, offset, async) |
subroutine | laccel_read_buffer_3 (this, n1, n2, n3, data, offset, async) |
subroutine | laccel_read_buffer_0_int32 (this, n1, data, offset, async) |
subroutine | laccel_read_buffer_1_int32 (this, n1, data, offset, async) |
subroutine | laccel_read_buffer_2_int32 (this, n1, n2, data, offset, async) |
subroutine | laccel_read_buffer_3_int32 (this, n1, n2, n3, data, offset, async) |
subroutine | laccel_set_kernel_arg_data (kernel, narg, data) |
subroutine | laccel_get_device_pointer_1 (host_pointer, device_pointer, dimensions) |
subroutine | laccel_get_device_pointer_2 (host_pointer, device_pointer, dimensions) |
subroutine | laccel_get_device_pointer_3 (host_pointer, device_pointer, dimensions) |
subroutine | laccel_get_device_pointer_1l (host_pointer, device_pointer, dimensions) |
subroutine | laccel_get_device_pointer_2l (host_pointer, device_pointer, dimensions) |
subroutine | laccel_get_device_pointer_3l (host_pointer, device_pointer, dimensions) |
subroutine | laccel_create_blas_alpha_beta_buffer (this, data, async) |
subroutine | laccel_release_blas_alpha_beta_buffer (this, data, async) |
Variables | |
integer, parameter, public | accel_mem_read_only = 0 |
integer, parameter, public | accel_mem_read_write = 1 |
integer, parameter, public | accel_mem_write_only = 2 |
type(accel_t), public | accel |
type(accel_mem_t), save, public | zm_0_buffer |
type(accel_mem_t), save, public | zm_1_buffer |
type(accel_mem_t), save, public | dm_0_buffer |
type(accel_mem_t), save, public | dm_1_buffer |
type(accel_kernel_t), target, save, public | kernel_vpsi |
type(accel_kernel_t), target, save, public | kernel_vpsi_complex |
type(accel_kernel_t), target, save, public | kernel_vpsi_spinors |
type(accel_kernel_t), target, save, public | kernel_vpsi_spinors_complex |
type(accel_kernel_t), target, save, public | kernel_daxpy |
type(accel_kernel_t), target, save, public | kernel_zaxpy |
type(accel_kernel_t), target, save, public | kernel_copy |
type(accel_kernel_t), target, save, public | kernel_copy_complex_to_real |
type(accel_kernel_t), target, save, public | kernel_copy_real_to_complex |
type(accel_kernel_t), target, save, public | dpack |
type(accel_kernel_t), target, save, public | zpack |
type(accel_kernel_t), target, save, public | dunpack |
type(accel_kernel_t), target, save, public | zunpack |
type(accel_kernel_t), target, save, public | kernel_ghost_reorder |
type(accel_kernel_t), target, save, public | kernel_density_real |
type(accel_kernel_t), target, save, public | kernel_density_complex |
type(accel_kernel_t), target, save, public | kernel_density_spinors |
type(accel_kernel_t), target, save, public | kernel_phase |
type(accel_kernel_t), target, save, public | kernel_phase_spiral |
type(accel_kernel_t), target, save, public | dkernel_dot_matrix |
type(accel_kernel_t), target, save, public | zkernel_dot_matrix |
type(accel_kernel_t), target, save, public | zkernel_dot_matrix_spinors |
type(accel_kernel_t), target, save, public | dkernel_batch_axpy |
type(accel_kernel_t), target, save, public | zkernel_batch_axpy |
type(accel_kernel_t), target, save, public | dkernel_ax_function_py |
type(accel_kernel_t), target, save, public | zkernel_ax_function_py |
type(accel_kernel_t), target, save, public | dkernel_batch_dotp |
type(accel_kernel_t), target, save, public | zkernel_batch_dotp |
type(accel_kernel_t), target, save, public | dzmul |
type(accel_kernel_t), target, save, public | zzmul |
integer, parameter | opencl_gpu = -1 |
integer, parameter | opencl_cpu = -2 |
integer, parameter | opencl_accelerator = -3 |
integer, parameter | opencl_default = -4 |
integer, parameter | cl_plat_invalid = -1 |
integer, parameter | cl_plat_amd = -2 |
integer, parameter | cl_plat_nvidia = -3 |
integer, parameter | cl_plat_ati = -4 |
integer, parameter | cl_plat_intel = -5 |
integer, public | cl_status |
integer | buffer_alloc_count |
integer(int64) | allocated_mem |
type(accel_kernel_t), pointer | head |
type(alloc_cache_t) | memcache |
pure logical function, public accel_oct_m::accel_is_enabled |
pure logical function, public accel_oct_m::accel_allow_cpu_only |
subroutine, public accel_oct_m::accel_init | ( | type(mpi_grp_t), intent(inout) | base_grp, |
type(namespace_t), intent(in) | namespace | ||
) |
subroutine, public accel_oct_m::accel_end | ( | type(namespace_t), intent(in) | namespace | ) |
|
private |
|
private |
|
private |
|
private |
subroutine, public accel_oct_m::accel_release_buffer | ( | type(accel_mem_t), intent(inout) | this, |
logical, intent(in), optional | async | ||
) |
subroutine, public accel_oct_m::accel_ensure_buffer_size | ( | type(accel_mem_t), intent(inout) | buffer, |
integer, intent(in) | flags, | ||
type(type_t), intent(in) | type, | ||
integer, intent(in) | required_size, | ||
logical, intent(in) | set_zero, | ||
logical, intent(in), optional | async | ||
) |
logical pure function, public accel_oct_m::accel_buffer_is_allocated | ( | type(accel_mem_t), intent(in) | this | ) |
|
private |
|
private |
|
private |
|
private |
integer pure function, public accel_oct_m::accel_max_workgroup_size |
integer function, public accel_oct_m::accel_kernel_workgroup_size | ( | type(accel_kernel_t), intent(inout) | kernel | ) |
subroutine, public accel_oct_m::clblas_print_error | ( | integer, intent(in) | ierr, |
character(len=*), intent(in) | name | ||
) |
subroutine, public accel_oct_m::clfft_print_error | ( | integer, intent(in) | ierr, |
character(len=*), intent(in) | name | ||
) |
|
private |
|
private |
|
private |
logical pure function, public accel_oct_m::accel_use_shared_mem |
subroutine, public accel_oct_m::accel_kernel_build | ( | type(accel_kernel_t), intent(inout) | this, |
character(len=*), intent(in) | file_name, | ||
character(len=*), intent(in) | kernel_name, | ||
character(len=*), intent(in), optional | flags | ||
) |
|
private |
subroutine, public accel_oct_m::accel_kernel_start_call | ( | type(accel_kernel_t), intent(inout), target | this, |
character(len=*), intent(in) | file_name, | ||
character(len=*), intent(in) | kernel_name, | ||
character(len=*), intent(in), optional | flags | ||
) |
integer(int64) pure function, public accel_oct_m::accel_global_memory_size |
integer(int64) pure function, public accel_oct_m::accel_local_memory_size |
integer pure function, public accel_oct_m::accel_max_size_per_dim | ( | integer, intent(in) | dim | ) |
subroutine, public accel_oct_m::accel_set_stream | ( | integer, intent(in) | stream_number | ) |
subroutine, public accel_oct_m::accel_get_stream | ( | integer, intent(inout) | stream_number | ) |
subroutine, public accel_oct_m::accel_synchronize_all_streams |
type(c_ptr) function, public accel_oct_m::daccel_get_pointer_with_offset | ( | type(c_ptr), intent(in) | buffer, |
integer(int64), intent(in) | offset | ||
) |
type(c_ptr) function, public accel_oct_m::zaccel_get_pointer_with_offset | ( | type(c_ptr), intent(in) | buffer, |
integer(int64), intent(in) | offset | ||
) |
subroutine, public accel_oct_m::accel_clean_pointer | ( | type(c_ptr), intent(in) | buffer | ) |
subroutine, public accel_oct_m::accel_get_unfolded_size | ( | integer(int64), intent(in) | size, |
integer(int64), intent(out) | grid_size, | ||
integer(int64), intent(out) | thread_block_size | ||
) |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
integer, parameter, public accel_oct_m::accel_mem_read_only = 0 |
integer, parameter, public accel_oct_m::accel_mem_read_write = 1 |
integer, parameter, public accel_oct_m::accel_mem_write_only = 2 |
type(accel_mem_t), save, public accel_oct_m::zm_0_buffer |
type(accel_mem_t), save, public accel_oct_m::zm_1_buffer |
type(accel_mem_t), save, public accel_oct_m::dm_0_buffer |
type(accel_mem_t), save, public accel_oct_m::dm_1_buffer |
type(accel_kernel_t), target, save, public accel_oct_m::kernel_vpsi |
type(accel_kernel_t), target, save, public accel_oct_m::kernel_vpsi_complex |
type(accel_kernel_t), target, save, public accel_oct_m::kernel_vpsi_spinors |
type(accel_kernel_t), target, save, public accel_oct_m::kernel_vpsi_spinors_complex |
type(accel_kernel_t), target, save, public accel_oct_m::kernel_daxpy |
type(accel_kernel_t), target, save, public accel_oct_m::kernel_zaxpy |
type(accel_kernel_t), target, save, public accel_oct_m::kernel_copy |
type(accel_kernel_t), target, save, public accel_oct_m::kernel_copy_complex_to_real |
type(accel_kernel_t), target, save, public accel_oct_m::kernel_copy_real_to_complex |
type(accel_kernel_t), target, save, public accel_oct_m::dpack |
type(accel_kernel_t), target, save, public accel_oct_m::zpack |
type(accel_kernel_t), target, save, public accel_oct_m::dunpack |
type(accel_kernel_t), target, save, public accel_oct_m::zunpack |
type(accel_kernel_t), target, save, public accel_oct_m::kernel_ghost_reorder |
type(accel_kernel_t), target, save, public accel_oct_m::kernel_density_real |
type(accel_kernel_t), target, save, public accel_oct_m::kernel_density_complex |
type(accel_kernel_t), target, save, public accel_oct_m::kernel_density_spinors |
type(accel_kernel_t), target, save, public accel_oct_m::kernel_phase |
type(accel_kernel_t), target, save, public accel_oct_m::kernel_phase_spiral |
type(accel_kernel_t), target, save, public accel_oct_m::dkernel_dot_matrix |
type(accel_kernel_t), target, save, public accel_oct_m::zkernel_dot_matrix |
type(accel_kernel_t), target, save, public accel_oct_m::zkernel_dot_matrix_spinors |
type(accel_kernel_t), target, save, public accel_oct_m::dkernel_batch_axpy |
type(accel_kernel_t), target, save, public accel_oct_m::zkernel_batch_axpy |
type(accel_kernel_t), target, save, public accel_oct_m::dkernel_ax_function_py |
type(accel_kernel_t), target, save, public accel_oct_m::zkernel_ax_function_py |
type(accel_kernel_t), target, save, public accel_oct_m::dkernel_batch_dotp |
type(accel_kernel_t), target, save, public accel_oct_m::zkernel_batch_dotp |
type(accel_kernel_t), target, save, public accel_oct_m::dzmul |
type(accel_kernel_t), target, save, public accel_oct_m::zzmul |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |