-
Notifications
You must be signed in to change notification settings - Fork 15
/
Copy pathmem_manager.h
94 lines (82 loc) · 4.02 KB
/
mem_manager.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
/** ExaTensor::TAL-SH: Memory management API header.
REVISION: 2021/12/29
Copyright (C) 2014-2022 Dmitry I. Lyakh (Liakh)
Copyright (C) 2014-2022 Oak Ridge National Laboratory (UT-Battelle)
LICENSE: BSD 3-Clause
-------------------------------------------------------------------
**/
#ifndef MEM_MANAGER_H_
#define MEM_MANAGER_H_
#include <cstddef>
//Types:
// Generic slab:
typedef struct{
size_t max_entries; //max number of entries in the slab
size_t entry_size; //entry size in bytes (can be larger than the slab data type because of alignment)
size_t alignment; //optional alignment of entries with respect to the slab base
size_t first_free; //first free entry number (stack pointer)
void * slab_base; //slab base pointer
void ** free_entries; //stack of free entries
#ifndef NO_GPU
int mem_mapped; //non-zero if the underlying Host memory was allocated via cudaHostAlloc() as portable mapped
#endif
} slab_t;
//Exported functions:
extern "C"{
//Buffer memory management (all devices):
int arg_buf_allocate(size_t *arg_buf_size, int *arg_max, int gpu_beg, int gpu_end); //generic
int arg_buf_deallocate(int gpu_beg, int gpu_end); //generic
int arg_buf_clean_host(); //Host only
int arg_buf_clean_gpu(int gpu_num); //NVidia GPU only
void * get_arg_buf_ptr_host(); //Host only
void * get_arg_buf_ptr_gpu(int gpu_num); //Nvidia GPU only
size_t get_arg_buf_size_host(); //Host only
size_t get_arg_buf_size_gpu(int gpu_num); //Nvidia GPU only
size_t get_blck_max_size_host(); //Host only
size_t get_blck_max_size_gpu(int gpu_num); //Nvidia GPU only
int get_blck_buf_sizes_host(size_t *blck_sizes); //Host only
int get_blck_buf_sizes_gpu(int gpu_num, size_t *blck_sizes); //NVidia GPU only
void print_blck_buf_sizes_host(); //Host only
int get_buf_entry_host(size_t bsize, char **entry_ptr, int *entry_num); //Host only
int free_buf_entry_host(int entry_num); //Host only
int get_buf_entry_gpu(int gpu_num, size_t bsize, char **entry_ptr, int *entry_num); //NVidia GPU only
int free_buf_entry_gpu(int gpu_num, int entry_num); //NVidia GPU only
int const_args_entry_get(int gpu_num, int *entry_num); //NVidia GPU only
int const_args_entry_free(int gpu_num, int entry_num); //NVidia GPU only
int get_buf_entry_from_address(int dev_id, const void * addr); //generic
void mem_log_start(); //generic
void mem_log_finish(); //generic
int mem_free_left(int dev_id, size_t * free_mem); //generic
int mem_print_stats(int dev_id); //generic
int slab_create(slab_t ** slab);
int slab_clean(slab_t * slab);
#ifndef NO_GPU
int slab_construct(slab_t * slab, size_t slab_entry_size, size_t slab_max_entries, size_t align = 0, int mapped = 0);
#else
int slab_construct(slab_t * slab, size_t slab_entry_size, size_t slab_max_entries, size_t align = 0);
#endif
int slab_entry_get(slab_t * slab, void ** slab_entry);
int slab_entry_release(slab_t * slab, void * slab_entry);
int slab_get_base_ptr(slab_t * slab, void ** base_ptr);
int slab_get_max_entries(slab_t * slab, size_t * max_entries);
int slab_get_entry_size(slab_t * slab, size_t * entry_size);
int slab_get_entry_offset(slab_t * slab, void * slab_entry_p, size_t * entry_offset);
int slab_destruct(slab_t * slab);
int slab_destroy(slab_t * slab);
int host_mem_alloc(void **host_ptr, size_t tsize, size_t align = 1);
int host_mem_free(void *host_ptr);
int host_mem_alloc_pin(void **host_ptr, size_t tsize); //generic
int host_mem_free_pin(void *host_ptr); //generic
int host_mem_register(void *host_ptr, size_t tsize); //generic
int host_mem_unregister(void *host_ptr); //generic
int mem_allocate(int dev_id, size_t bytes, int in_buffer, void ** mem_ptr); //generic
int mem_free(int dev_id, void ** mem_ptr); // generic
int mi_entry_get(int ** mi_entry_p); //generic
int mi_entry_release(int * mi_entry_p); //generic
int mi_entry_pinned(int * mi_entry_p); //generic
#ifndef NO_GPU
int gpu_mem_alloc(void **dev_ptr, size_t tsize, int gpu_id = -1); //NVidia GPU only
int gpu_mem_free(void *dev_ptr, int gpu_id = -1); //NVidia GPU only
#endif /*NO_GPU*/
}
#endif /*MEM_MANAGER_H_*/