-
Notifications
You must be signed in to change notification settings - Fork 12
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Merge pull request #10 from edgargabriel/topic/ipc-context
topic/ipc context
- Loading branch information
Showing
7 changed files
with
729 additions
and
0 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -27,4 +27,5 @@ target_sources( | |
${PROJECT_NAME} | ||
PRIVATE | ||
ipc_policy.cpp | ||
context_ipc.cpp | ||
) |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,129 @@ | ||
/****************************************************************************** | ||
* Copyright (c) 2024 Advanced Micro Devices, Inc. All rights reserved. | ||
* | ||
* Permission is hereby granted, free of charge, to any person obtaining a copy | ||
* of this software and associated documentation files (the "Software"), to | ||
* deal in the Software without restriction, including without limitation the | ||
* rights to use, copy, modify, merge, publish, distribute, sublicense, and/or | ||
* sell copies of the Software, and to permit persons to whom the Software is | ||
* furnished to do so, subject to the following conditions: | ||
* | ||
* The above copyright notice and this permission notice shall be included in | ||
* all copies or substantial portions of the Software. | ||
* | ||
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR | ||
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, | ||
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE | ||
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER | ||
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING | ||
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS | ||
* IN THE SOFTWARE. | ||
*****************************************************************************/ | ||
|
||
#include "context_ipc.hpp" | ||
#include "context_ipc_tmpl_device.hpp" | ||
|
||
#include <hip/hip_runtime.h> | ||
#include <hip/amd_detail/amd_device_functions.h> | ||
#include <unistd.h> | ||
|
||
#include <cstdio> | ||
#include <cstdlib> | ||
|
||
#include "config.h" // NOLINT(build/include_subdir) | ||
#include "roc_shmem/roc_shmem.hpp" | ||
|
||
namespace rocshmem { | ||
|
||
__host__ IPCContext::IPCContext(Backend *b) | ||
: Context(b, false) { | ||
} | ||
|
||
__device__ void IPCContext::threadfence_system() { | ||
} | ||
|
||
__device__ void IPCContext::ctx_create() { | ||
} | ||
|
||
__device__ void IPCContext::ctx_destroy(){ | ||
} | ||
|
||
__device__ void IPCContext::putmem(void *dest, const void *source, size_t nelems, | ||
int pe) { | ||
} | ||
|
||
__device__ void IPCContext::getmem(void *dest, const void *source, size_t nelems, | ||
int pe) { | ||
} | ||
|
||
__device__ void IPCContext::putmem_nbi(void *dest, const void *source, | ||
size_t nelems, int pe) { | ||
} | ||
|
||
__device__ void IPCContext::getmem_nbi(void *dest, const void *source, | ||
size_t nelems, int pe) { | ||
} | ||
|
||
__device__ void IPCContext::fence() { | ||
} | ||
|
||
__device__ void IPCContext::fence(int pe) { | ||
} | ||
|
||
__device__ void IPCContext::quiet() { | ||
} | ||
|
||
__device__ void *IPCContext::shmem_ptr(const void *dest, int pe) { | ||
void *ret = nullptr; | ||
return ret; | ||
} | ||
|
||
__device__ void IPCContext::barrier_all() { | ||
__syncthreads(); | ||
} | ||
|
||
__device__ void IPCContext::sync_all() { | ||
__syncthreads(); | ||
} | ||
|
||
__device__ void IPCContext::sync(roc_shmem_team_t team) { | ||
__syncthreads(); | ||
} | ||
|
||
__device__ void IPCContext::putmem_wg(void *dest, const void *source, | ||
size_t nelems, int pe) { | ||
__syncthreads(); | ||
} | ||
|
||
__device__ void IPCContext::getmem_wg(void *dest, const void *source, | ||
size_t nelems, int pe) { | ||
__syncthreads(); | ||
} | ||
|
||
__device__ void IPCContext::putmem_nbi_wg(void *dest, const void *source, | ||
size_t nelems, int pe) { | ||
__syncthreads(); | ||
} | ||
|
||
__device__ void IPCContext::getmem_nbi_wg(void *dest, const void *source, | ||
size_t nelems, int pe) { | ||
__syncthreads(); | ||
} | ||
|
||
__device__ void IPCContext::putmem_wave(void *dest, const void *source, | ||
size_t nelems, int pe) { | ||
} | ||
|
||
__device__ void IPCContext::getmem_wave(void *dest, const void *source, | ||
size_t nelems, int pe) { | ||
} | ||
|
||
__device__ void IPCContext::putmem_nbi_wave(void *dest, const void *source, | ||
size_t nelems, int pe) { | ||
} | ||
|
||
__device__ void IPCContext::getmem_nbi_wave(void *dest, const void *source, | ||
size_t nelems, int pe) { | ||
} | ||
|
||
} // namespace rocshmem |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,241 @@ | ||
/****************************************************************************** | ||
* Copyright (c) 2024 Advanced Micro Devices, Inc. All rights reserved. | ||
* | ||
* Permission is hereby granted, free of charge, to any person obtaining a copy | ||
* of this software and associated documentation files (the "Software"), to | ||
* deal in the Software without restriction, including without limitation the | ||
* rights to use, copy, modify, merge, publish, distribute, sublicense, and/or | ||
* sell copies of the Software, and to permit persons to whom the Software is | ||
* furnished to do so, subject to the following conditions: | ||
* | ||
* The above copyright notice and this permission notice shall be included in | ||
* all copies or substantial portions of the Software. | ||
* | ||
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR | ||
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, | ||
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE | ||
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER | ||
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING | ||
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS | ||
* IN THE SOFTWARE. | ||
*****************************************************************************/ | ||
|
||
#ifndef LIBRARY_SRC_IPC_CONTEXT_DEVICE_HPP_ | ||
#define LIBRARY_SRC_IPC_CONTEXT_DEVICE_HPP_ | ||
|
||
#include "../context.hpp" | ||
|
||
namespace rocshmem { | ||
|
||
class IPCContext : public Context { | ||
public: | ||
__host__ IPCContext(Backend *b); | ||
|
||
__device__ IPCContext(Backend *b); | ||
|
||
__device__ void threadfence_system(); | ||
|
||
__device__ void ctx_create(); | ||
|
||
__device__ void ctx_destroy(); | ||
|
||
__device__ void putmem(void *dest, const void *source, size_t nelems, int pe); | ||
|
||
__device__ void getmem(void *dest, const void *source, size_t nelems, int pe); | ||
|
||
__device__ void putmem_nbi(void *dest, const void *source, size_t nelems, | ||
int pe); | ||
|
||
__device__ void getmem_nbi(void *dest, const void *source, size_t size, | ||
int pe); | ||
|
||
__device__ void fence(); | ||
|
||
__device__ void fence(int pe); | ||
|
||
__device__ void quiet(); | ||
|
||
__device__ void *shmem_ptr(const void *dest, int pe); | ||
|
||
__device__ void barrier_all(); | ||
|
||
__device__ void sync_all(); | ||
|
||
__device__ void sync(roc_shmem_team_t team); | ||
|
||
template <typename T> | ||
__device__ void p(T *dest, T value, int pe); | ||
|
||
template <typename T> | ||
__device__ void put(T *dest, const T *source, size_t nelems, int pe); | ||
|
||
template <typename T> | ||
__device__ void put_nbi(T *dest, const T *source, size_t nelems, int pe); | ||
|
||
template <typename T> | ||
__device__ T g(const T *source, int pe); | ||
|
||
template <typename T> | ||
__device__ void get(T *dest, const T *source, size_t nelems, int pe); | ||
|
||
template <typename T> | ||
__device__ void get_nbi(T *dest, const T *source, size_t nelems, int pe); | ||
|
||
// Atomic operations | ||
template <typename T> | ||
__device__ void amo_add(void *dst, T value, int pe); | ||
|
||
template <typename T> | ||
__device__ void amo_set(void *dst, T value, int pe); | ||
|
||
template <typename T> | ||
__device__ T amo_swap(void *dst, T value, int pe); | ||
|
||
template <typename T> | ||
__device__ T amo_fetch_and(void *dst, T value, int pe); | ||
|
||
template <typename T> | ||
__device__ void amo_and(void *dst, T value, int pe); | ||
|
||
template <typename T> | ||
__device__ T amo_fetch_or(void *dst, T value, int pe); | ||
|
||
template <typename T> | ||
__device__ void amo_or(void *dst, T value, int pe); | ||
|
||
template <typename T> | ||
__device__ T amo_fetch_xor(void *dst, T value, int pe); | ||
|
||
template <typename T> | ||
__device__ void amo_xor(void *dst, T value, int pe); | ||
|
||
template <typename T> | ||
__device__ void amo_cas(void *dst, T value, T cond, int pe); | ||
|
||
template <typename T> | ||
__device__ T amo_fetch_add(void *dst, T value, int pe); | ||
|
||
template <typename T> | ||
__device__ T amo_fetch_cas(void *dst, T value, T cond, int pe); | ||
|
||
// Collectives | ||
template <typename T, ROC_SHMEM_OP Op> | ||
__device__ void to_all(T *dest, const T *source, int nreduce, int PE_start, | ||
int logPE_stride, int PE_size, T *pWrk, | ||
long *pSync); // NOLINT(runtime/int) | ||
|
||
template <typename T, ROC_SHMEM_OP Op> | ||
__device__ void to_all(roc_shmem_team_t team, T *dest, const T *source, | ||
int nreduce); | ||
|
||
template <typename T> | ||
__device__ void broadcast(roc_shmem_team_t team, T *dest, const T *source, | ||
int nelems, int pe_root); | ||
|
||
template <typename T> | ||
__device__ void broadcast(T *dest, const T *source, int nelems, int pe_root, | ||
int pe_start, int log_pe_stride, int pe_size, | ||
long *p_sync); // NOLINT(runtime/int) | ||
template <typename T> | ||
__device__ void alltoall(roc_shmem_team_t team, T *dest, const T *source, | ||
int nelems); | ||
template <typename T> | ||
__device__ void fcollect(roc_shmem_team_t team, T *dest, const T *source, | ||
int nelems); | ||
|
||
|
||
// Block/wave functions | ||
__device__ void putmem_wg(void *dest, const void *source, size_t nelems, | ||
int pe); | ||
|
||
__device__ void getmem_wg(void *dest, const void *source, size_t nelems, | ||
int pe); | ||
|
||
__device__ void putmem_nbi_wg(void *dest, const void *source, size_t nelems, | ||
int pe); | ||
|
||
__device__ void getmem_nbi_wg(void *dest, const void *source, size_t size, | ||
int pe); | ||
|
||
__device__ void putmem_wave(void *dest, const void *source, size_t nelems, | ||
int pe); | ||
|
||
__device__ void getmem_wave(void *dest, const void *source, size_t nelems, | ||
int pe); | ||
|
||
__device__ void putmem_nbi_wave(void *dest, const void *source, size_t nelems, | ||
int pe); | ||
|
||
__device__ void getmem_nbi_wave(void *dest, const void *source, size_t size, | ||
int pe); | ||
|
||
template <typename T> | ||
__device__ void put_wg(T *dest, const T *source, size_t nelems, int pe); | ||
|
||
template <typename T> | ||
__device__ void put_nbi_wg(T *dest, const T *source, size_t nelems, int pe); | ||
|
||
template <typename T> | ||
__device__ void put_wave(T *dest, const T *source, size_t nelems, int pe); | ||
|
||
template <typename T> | ||
__device__ void put_nbi_wave(T *dest, const T *source, size_t nelems, int pe); | ||
|
||
template <typename T> | ||
__device__ void get_wg(T *dest, const T *source, size_t nelems, int pe); | ||
|
||
template <typename T> | ||
__device__ void get_nbi_wg(T *dest, const T *source, size_t nelems, int pe); | ||
|
||
|
||
template <typename T> | ||
__device__ void get_wave(T *dest, const T *source, size_t nelems, int pe); | ||
|
||
template <typename T> | ||
__device__ void get_nbi_wave(T *dest, const T *source, size_t nelems, int pe); | ||
|
||
// Wait / Test functions | ||
template <typename T> | ||
__device__ void wait_until(T* ptr, roc_shmem_cmps cmp, T val); | ||
|
||
template <typename T> | ||
__device__ void wait_until_all(T* ptr, size_t nelems, | ||
const int *status, | ||
roc_shmem_cmps cmp, T val); | ||
|
||
template <typename T> | ||
__device__ size_t wait_until_any(T* ptr, size_t nelems, | ||
const int *status, | ||
roc_shmem_cmps cmp, T val); | ||
|
||
template <typename T> | ||
__device__ size_t wait_until_some(T* ptr, size_t nelems, | ||
size_t* indices, | ||
const int *status, | ||
roc_shmem_cmps cmp, T val); | ||
|
||
template <typename T> | ||
__device__ void wait_until_all_vector(T* ptr, size_t nelems, | ||
const int *status, | ||
roc_shmem_cmps cmp, T* vals); | ||
|
||
template <typename T> | ||
__device__ size_t wait_until_any_vector(T* ptr, size_t nelems, | ||
const int *status, | ||
roc_shmem_cmps cmp, T* vals); | ||
template <typename T> | ||
__device__ size_t wait_until_some_vector(T* ptr, size_t nelems, | ||
size_t* indices, | ||
const int *status, | ||
roc_shmem_cmps cmp, T* vals); | ||
|
||
template <typename T> | ||
__device__ int test(T* ptr, roc_shmem_cmps cmp, T val); | ||
|
||
private: | ||
|
||
}; | ||
|
||
} // namespace rocshmem | ||
|
||
#endif // LIBRARY_SRC_GPU_IB_CONTEXT_IB_DEVICE_HPP_ |
Oops, something went wrong.