(git:ed6f26b)
Loading...
Searching...
No Matches
dbm_multiply_gpu_kernel.h
Go to the documentation of this file.
1
/*----------------------------------------------------------------------------*/
2
/* CP2K: A general program to perform molecular dynamics simulations */
3
/* Copyright 2000-2025 CP2K developers group <https://cp2k.org> */
4
/* */
5
/* SPDX-License-Identifier: BSD-3-Clause */
6
/*----------------------------------------------------------------------------*/
7
8
#ifndef DBM_MULTIPLY_GPU_KERNEL_H
9
#define DBM_MULTIPLY_GPU_KERNEL_H
10
11
#include "../offload/offload_runtime.h"
12
#if defined(__OFFLOAD) && !defined(__NO_OFFLOAD_DBM)
13
14
#include "
dbm_internal.h
"
15
16
#ifdef __cplusplus
17
extern
"C"
{
18
#endif
19
20
/*******************************************************************************
21
* \brief Internal routine for launching the GPU kernel.
22
* All arguments are assumed to be device pointers.
23
* \author Ole Schuett
24
******************************************************************************/
25
void
dbm_multiply_gpu_launch_kernel(
26
const
offloadStream_t stream,
const
double
alpha,
const
int
ntasks,
27
const
dbm_task_t
*tasks_host,
const
dbm_task_t
*tasks,
28
const
double
*pack_a_data,
const
double
*pack_b_data,
double
*shard_c_data);
29
30
#ifdef __cplusplus
31
}
32
#endif
33
34
#endif
// defined(__OFFLOAD) && !defined(__NO_OFFLOAD_DBM)
35
#endif
36
37
// EOF
dbm_internal.h
dbm_task_t
Internal struct for storing a task, i.e. a single block multiplication.
Definition
dbm_internal.h:43
dbm
dbm_multiply_gpu_kernel.h
Generated by
1.9.8