Add files via upload
This commit is contained in:
parent
0a8a3a144b
commit
761f1eb91d
5 changed files with 121 additions and 33 deletions
|
@ -5,10 +5,15 @@
|
||||||
|
|
||||||
namespace py = pybind11;
|
namespace py = pybind11;
|
||||||
|
|
||||||
PYBIND11_MODULE(PySpikeGenerationCPU, m) {
|
PYBIND11_MODULE(PySpikeGenerationCPU, m)
|
||||||
|
{
|
||||||
m.doc() = "SpikeGenerationCPU Module";
|
m.doc() = "SpikeGenerationCPU Module";
|
||||||
py::class_<SpikeGenerationCPU>(m, "SpikeGenerationCPU")
|
py::class_<SpikeGenerationCPU>(m, "SpikeGenerationCPU")
|
||||||
.def(py::init<>())
|
.def(py::init<>())
|
||||||
|
.def("gpu_occupancy_export",
|
||||||
|
&SpikeGenerationCPU::gpu_occupancy_export)
|
||||||
|
.def("gpu_occupancy_import",
|
||||||
|
&SpikeGenerationCPU::gpu_occupancy_import)
|
||||||
.def("spike_generation",
|
.def("spike_generation",
|
||||||
&SpikeGenerationCPU::entrypoint);
|
&SpikeGenerationCPU::entrypoint);
|
||||||
}
|
}
|
||||||
|
|
|
@ -198,3 +198,23 @@ size_t SpikeGenerationCPU::lower_bound(float* data_ptr,
|
||||||
}
|
}
|
||||||
return start_of_range;
|
return start_of_range;
|
||||||
};
|
};
|
||||||
|
|
||||||
|
void SpikeGenerationCPU::gpu_occupancy_export(
|
||||||
|
size_t dim_x,
|
||||||
|
size_t dim_y,
|
||||||
|
size_t number_of_pattern,
|
||||||
|
size_t spike_dim,
|
||||||
|
int64_t setting_memory_addr,
|
||||||
|
size_t setting_dim_0,
|
||||||
|
size_t setting_dim_1)
|
||||||
|
{
|
||||||
|
return;
|
||||||
|
};
|
||||||
|
|
||||||
|
void SpikeGenerationCPU::gpu_occupancy_import(
|
||||||
|
int64_t setting_memory_addr,
|
||||||
|
size_t setting_dim_0,
|
||||||
|
size_t setting_dim_1)
|
||||||
|
{
|
||||||
|
return;
|
||||||
|
};
|
|
@ -6,33 +6,69 @@
|
||||||
#include <cctype>
|
#include <cctype>
|
||||||
#include <iostream>
|
#include <iostream>
|
||||||
|
|
||||||
class SpikeGenerationCPU {
|
class SpikeGenerationCPU
|
||||||
public:
|
{
|
||||||
|
public:
|
||||||
SpikeGenerationCPU();
|
SpikeGenerationCPU();
|
||||||
~SpikeGenerationCPU();
|
~SpikeGenerationCPU();
|
||||||
|
|
||||||
void entrypoint(
|
void entrypoint(
|
||||||
int64_t input_pointer_addr, int64_t input_dim_0, int64_t input_dim_1,
|
int64_t input_pointer_addr,
|
||||||
int64_t input_dim_2, int64_t input_dim_3,
|
int64_t input_dim_0,
|
||||||
int64_t random_values_pointer_addr, int64_t random_values_dim_0,
|
int64_t input_dim_1,
|
||||||
int64_t random_values_dim_1, int64_t random_values_dim_2,
|
int64_t input_dim_2,
|
||||||
int64_t random_values_dim_3, int64_t output_pointer_addr,
|
int64_t input_dim_3,
|
||||||
int64_t output_dim_0, int64_t output_dim_1, int64_t output_dim_2,
|
int64_t random_values_pointer_addr,
|
||||||
int64_t output_dim_3, int64_t number_of_cpu_processes);
|
int64_t random_values_dim_0,
|
||||||
|
int64_t random_values_dim_1,
|
||||||
|
int64_t random_values_dim_2,
|
||||||
|
int64_t random_values_dim_3,
|
||||||
|
int64_t output_pointer_addr,
|
||||||
|
int64_t output_dim_0,
|
||||||
|
int64_t output_dim_1,
|
||||||
|
int64_t output_dim_2,
|
||||||
|
int64_t output_dim_3,
|
||||||
|
int64_t number_of_cpu_processes);
|
||||||
|
|
||||||
private:
|
void gpu_occupancy_export(
|
||||||
void spike_generation(float* input_pointer, size_t input_dim_c0,
|
size_t dim_x,
|
||||||
size_t input_dim_c1, size_t input_dim_c2,
|
size_t dim_y,
|
||||||
|
size_t number_of_pattern,
|
||||||
|
size_t spike_dim,
|
||||||
|
int64_t setting_memory_addr,
|
||||||
|
size_t setting_dim_0,
|
||||||
|
size_t setting_dim_1);
|
||||||
|
|
||||||
|
void gpu_occupancy_import(
|
||||||
|
int64_t setting_memory_addr,
|
||||||
|
size_t setting_dim_0,
|
||||||
|
size_t setting_dim_1);
|
||||||
|
|
||||||
|
private:
|
||||||
|
void spike_generation(
|
||||||
|
float* input_pointer,
|
||||||
|
size_t input_dim_c0,
|
||||||
|
size_t input_dim_c1,
|
||||||
|
size_t input_dim_c2,
|
||||||
float* random_values_pointer,
|
float* random_values_pointer,
|
||||||
size_t random_values_dim_c0,
|
size_t random_values_dim_c0,
|
||||||
size_t random_values_dim_c1,
|
size_t random_values_dim_c1,
|
||||||
size_t random_values_dim_c2, int64_t* output_pointer,
|
size_t random_values_dim_c2,
|
||||||
size_t output_dim_c0, size_t output_dim_c1,
|
int64_t* output_pointer,
|
||||||
size_t output_dim_c2, size_t x_dim, size_t y_dim,
|
size_t output_dim_c0,
|
||||||
size_t spike_dim, size_t h_dim, size_t pattern_id);
|
size_t output_dim_c1,
|
||||||
|
size_t output_dim_c2,
|
||||||
|
size_t x_dim,
|
||||||
|
size_t y_dim,
|
||||||
|
size_t spike_dim,
|
||||||
|
size_t h_dim,
|
||||||
|
size_t pattern_id);
|
||||||
|
|
||||||
size_t lower_bound(float* data_ptr, size_t data_length,
|
size_t lower_bound(
|
||||||
size_t data_ptr_stride, float compare_to_value);
|
float* data_ptr,
|
||||||
|
size_t data_length,
|
||||||
|
size_t data_ptr_stride,
|
||||||
|
float compare_to_value);
|
||||||
};
|
};
|
||||||
|
|
||||||
#endif /* SPIKEGENERATIONCPU */
|
#endif /* SPIKEGENERATIONCPU */
|
||||||
|
|
|
@ -87,7 +87,7 @@ void SpikeGenerationGPU::entrypoint(
|
||||||
size_t x_dim = output_dim_2;
|
size_t x_dim = output_dim_2;
|
||||||
size_t y_dim = output_dim_2;
|
size_t y_dim = output_dim_2;
|
||||||
|
|
||||||
assert ((number_of_cpu_processes <= 0));
|
assert((number_of_cpu_processes <= 0));
|
||||||
|
|
||||||
gpu_spike_generation(
|
gpu_spike_generation(
|
||||||
input_pointer,
|
input_pointer,
|
||||||
|
@ -208,9 +208,9 @@ void SpikeGenerationGPU::gpu_spike_generation(
|
||||||
assert((x_dim < 65535));
|
assert((x_dim < 65535));
|
||||||
assert((y_dim < 65535));
|
assert((y_dim < 65535));
|
||||||
|
|
||||||
// //////////////////////////////////////
|
// //////////////////////////////////////
|
||||||
// Calculate the distribution on the GPU
|
// Calculate the distribution on the GPU
|
||||||
// //////////////////////////////////////
|
// //////////////////////////////////////
|
||||||
|
|
||||||
int min_grid_size;
|
int min_grid_size;
|
||||||
int block_size;
|
int block_size;
|
||||||
|
@ -222,6 +222,15 @@ void SpikeGenerationGPU::gpu_spike_generation(
|
||||||
status = cudaOccupancyMaxPotentialBlockSize(&min_grid_size, &block_size,
|
status = cudaOccupancyMaxPotentialBlockSize(&min_grid_size, &block_size,
|
||||||
(void*)kernel_spike_generation,
|
(void*)kernel_spike_generation,
|
||||||
dynamic_s_mem_size, max_threadable_tasks);
|
dynamic_s_mem_size, max_threadable_tasks);
|
||||||
|
if (status != cudaSuccess)
|
||||||
|
{
|
||||||
|
std::cerr << "CUDA Runtime Error at: "
|
||||||
|
<< __FILE__
|
||||||
|
<< ":"
|
||||||
|
<< __LINE__
|
||||||
|
<< std::endl;
|
||||||
|
std::cerr << cudaGetErrorString(status) << std::endl;
|
||||||
|
}
|
||||||
assert((status == cudaSuccess));
|
assert((status == cudaSuccess));
|
||||||
|
|
||||||
grid_size = ((number_of_pattern * spike_dim) + block_size - 1) / block_size;
|
grid_size = ((number_of_pattern * spike_dim) + block_size - 1) / block_size;
|
||||||
|
@ -248,8 +257,17 @@ void SpikeGenerationGPU::gpu_spike_generation(
|
||||||
h_dim,
|
h_dim,
|
||||||
(number_of_pattern * spike_dim));
|
(number_of_pattern * spike_dim));
|
||||||
|
|
||||||
cudaDeviceSynchronize();
|
status = cudaDeviceSynchronize();
|
||||||
|
if (status != cudaSuccess)
|
||||||
|
{
|
||||||
|
std::cerr << "CUDA Runtime Error at: "
|
||||||
|
<< __FILE__
|
||||||
|
<< ":"
|
||||||
|
<< __LINE__
|
||||||
|
<< std::endl;
|
||||||
|
std::cerr << cudaGetErrorString(status) << std::endl;
|
||||||
|
}
|
||||||
|
assert((status == cudaSuccess));
|
||||||
return;
|
return;
|
||||||
};
|
};
|
||||||
|
|
||||||
|
|
|
@ -98,6 +98,15 @@ void occupancy_kernel_spike_generation(
|
||||||
status = cudaOccupancyMaxPotentialBlockSize(
|
status = cudaOccupancyMaxPotentialBlockSize(
|
||||||
&min_grid_size, &thread_block_size, (void*)kernel_spike_generation, 0,
|
&min_grid_size, &thread_block_size, (void*)kernel_spike_generation, 0,
|
||||||
max_threadable_tasks);
|
max_threadable_tasks);
|
||||||
|
if (status != cudaSuccess)
|
||||||
|
{
|
||||||
|
std::cerr << "CUDA Runtime Error at: "
|
||||||
|
<< __FILE__
|
||||||
|
<< ":"
|
||||||
|
<< __LINE__
|
||||||
|
<< std::endl;
|
||||||
|
std::cerr << cudaGetErrorString(status) << std::endl;
|
||||||
|
}
|
||||||
assert((status == cudaSuccess));
|
assert((status == cudaSuccess));
|
||||||
|
|
||||||
grid_size =
|
grid_size =
|
||||||
|
|
Loading…
Reference in a new issue