Skip to content

Commit

Permalink
Add 1.0.1 release from tugraz.at
Browse files Browse the repository at this point in the history
  • Loading branch information
ax3l committed Jan 6, 2014
1 parent 7846a65 commit 7aa00b9
Show file tree
Hide file tree
Showing 6 changed files with 1,272 additions and 0 deletions.
23 changes: 23 additions & 0 deletions CMakeLists.txt
Original file line number Diff line number Diff line change
@@ -0,0 +1,23 @@
# Build script for the ScatterAlloc example executable.
#
# cmake_minimum_required() has to run before project() so that the version
# check and policy defaults are in place when the project is set up.
cmake_minimum_required(VERSION 2.6)
project(ScatterAlloc)

# Base nvcc flags; they are set before find_package(CUDA), exactly as before.
set(CUDA_NVCC_FLAGS "-arch=sm_20;-use_fast_math;")
find_package(CUDA REQUIRED)
include_directories(${CUDA_INCLUDE_DIRS})
cuda_include_directories(${CUDA_INCLUDE_DIRS})

# Optional: verbose ptxas output and keeping the intermediate files.
option(CUDA_OUTPUT_INTERMEDIATE_CODE "Output ptx code" OFF)
if(CUDA_OUTPUT_INTERMEDIATE_CODE)
  set(CUDA_NVCC_FLAGS "${CUDA_NVCC_FLAGS};-Xptxas;-v;--keep")
endif(CUDA_OUTPUT_INTERMEDIATE_CODE)

# Optional: user-selectable optimization flag that is appended to the nvcc flags.
set(CUDA_OPTIMIZATION_TYPE "unset" CACHE STRING "CUDA Optimization")
set_property(CACHE CUDA_OPTIMIZATION_TYPE PROPERTY STRINGS "unset;-G0;-O0;-O1;-O2;-O3")
# The variable is quoted so that an empty cache entry cannot turn the condition
# into a malformed expression; an empty value is treated like "unset".
if(NOT "${CUDA_OPTIMIZATION_TYPE}" STREQUAL "unset" AND NOT "${CUDA_OPTIMIZATION_TYPE}" STREQUAL "")
  set(CUDA_NVCC_FLAGS "${CUDA_NVCC_FLAGS};${CUDA_OPTIMIZATION_TYPE}")
endif()

# The headers are listed next to example.cu, as in the original target.
cuda_add_executable(ScatterAllocExample
  example.cu
  ${CMAKE_CURRENT_SOURCE_DIR}/tools/heap.cuh
  ${CMAKE_CURRENT_SOURCE_DIR}/tools/heap_impl.cuh
  ${CMAKE_CURRENT_SOURCE_DIR}/tools/utils.h)
29 changes: 29 additions & 0 deletions LICENSE
Original file line number Diff line number Diff line change
@@ -0,0 +1,29 @@
/*
ScatterAlloc: Massively Parallel Dynamic Memory Allocation for the GPU.
http://www.icg.tugraz.at/project/mvp

Copyright (C) 2012 Institute for Computer Graphics and Vision,
Graz University of Technology

Author(s): Markus Steinberger - steinberger ( at ) icg.tugraz.at
Bernhard Kainz - kainz ( at ) icg.tugraz.at
Michael Kenzel - kenzel ( at ) icg.tugraz.at

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
*/
131 changes: 131 additions & 0 deletions example.cu
Original file line number Diff line number Diff line change
@@ -0,0 +1,131 @@
/*
ScatterAlloc: Massively Parallel Dynamic Memory Allocation for the GPU.
http://www.icg.tugraz.at/project/mvp
Copyright (C) 2012 Institute for Computer Graphics and Vision,
Graz University of Technology
Author(s): Markus Steinberger - steinberger ( at ) icg.tugraz.at
Michael Kenzel - kenzel ( at ) icg.tugraz.at
Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:
The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
*/

#include <cuda.h>
typedef unsigned int uint;

//replace the cuda malloc and free calls
#define OVERWRITE_MALLOC
//set the template arguments using HEAPARGS
// pagesize ... bytes per page
// accessblocks ... number of superblocks
// regionsize ... number of regions for the meta data structure
// wastefactor ... how much memory can be wasted per alloc (multiplicative factor)
// use_coalescing ... combine the memory requests within each warp
// resetfreedpages ... allow pages to be reused with a different size
#define HEAPARGS 4096, 8, 16, 2, true, false
//include the scatter alloc heap
#include "tools/heap_impl.cuh"

#include "tools/utils.h"

#ifdef WIN32
#define WIN32_LEAN_AND_MEAN
#define NOMINMAX
#include <windows.h>
#include <conio.h>
#endif

#include <iostream>
#include <stdio.h>

void runexample(int cuda_device);


/**
 * Program entry point.
 *
 * Reads an optional CUDA device index from argv[1] (default 0), prints the
 * device name, rejects devices with a compute capability below 2.0, runs the
 * example on the selected device and finally resets the device.
 *
 * Return values:
 *    0  the example ran to completion
 *   -1  an exception was caught (its message, if any, is printed)
 *   -2  the device does not provide compute capability >= 2.0
 *   -3  the device properties could not be queried (e.g. invalid index)
 */
int main(int argc, char** argv)
{
  try
  {
    int cuda_device = argc > 1 ? atoi(argv[1]) : 0;

    cudaDeviceProp deviceProp;
    // Without this check a failed query would leave deviceProp uninitialized
    // and the name / capability test below would read garbage.
    const cudaError_t propStatus = cudaGetDeviceProperties(&deviceProp, cuda_device);
    if( propStatus != cudaSuccess ) {
      std::cerr << "Could not query properties of CUDA device " << cuda_device
                << ": " << cudaGetErrorString(propStatus) << std::endl;
      return -3;
    }
    std::cout << "Using device: " << deviceProp.name << std::endl;

    if( deviceProp.major < 2 ) {
      std::cerr << "This GPU with Compute Capability " << deviceProp.major
                << "." << deviceProp.minor << " does not meet minimum requirements." << std::endl;
      std::cerr << "A GPU with Compute Capability >= 2.0 is required." << std::endl;
      return -2;
    }

    runexample(cuda_device);

    cudaDeviceReset();
  }
  catch (const std::exception& e)
  {
    std::cout << e.what() << std::endl;
#ifdef WIN32
    // keep the console window open until a key is pressed
    while (!_kbhit());
#endif
    return -1;
  }
  catch (...)
  {
    std::cout << "unknown exception!" << std::endl;
#ifdef WIN32
    // keep the console window open until a key is pressed
    while (!_kbhit());
#endif
    return -1;
  }

  return 0;
}


// Kernel: every thread allocates an array of (threadIdx.x % 4) uints with
// operator new and stores the resulting pointer in parray at its global
// thread index. There is no bounds check, so parray must hold at least
// gridDim.x * blockDim.x entries (1D launch).
__global__ void allocSomething(uint** parray)
{
  const unsigned int slot = blockIdx.x * blockDim.x + threadIdx.x;
  const unsigned int count = threadIdx.x % 4;
  parray[slot] = new uint[count];
}
// Kernel: every thread releases, via delete[], the pointer stored in parray
// at its global thread index. There is no bounds check, so parray must hold
// at least gridDim.x * blockDim.x entries (1D launch).
__global__ void freeSomething(uint** parray)
{
  const unsigned int slot = blockIdx.x * blockDim.x + threadIdx.x;
  uint* const victim = parray[slot];
  delete[] victim;
}


/**
 * Runs the allocation example on the given CUDA device.
 *
 * Selects the device, initializes the heap, lets 64 blocks of 128 threads
 * each allocate a small array on the device, frees those arrays again in a
 * second kernel and releases the pointer table afterwards.
 *
 * Every CUDA runtime call and both kernel launches are routed through
 * CUDA_CHECKED_CALL (defined outside this block; how it reports a failure
 * is not visible here).
 *
 * @param cuda_device index of the CUDA device to run on
 */
void runexample(int cuda_device)
{
  CUDA_CHECKED_CALL(cudaSetDevice(cuda_device));

  //init the heap
  initHeap();
  //you can also specify the size of the heap in bytes
  //initHeap(8U*1024U*1024U);

  size_t block = 128;
  size_t grid = 64;

  // one pointer slot per launched thread
  uint** data = 0;
  CUDA_CHECKED_CALL(cudaMalloc(&data, grid*block*sizeof(uint*)));

  allocSomething<<<grid,block>>>(data);
  // a launch does not return an error itself; fetch launch failures explicitly
  CUDA_CHECKED_CALL(cudaGetLastError());
  CUDA_CHECKED_CALL(cudaDeviceSynchronize());

  freeSomething<<<grid,block>>>(data);
  CUDA_CHECKED_CALL(cudaGetLastError());
  CUDA_CHECKED_CALL(cudaDeviceSynchronize());

  // release the pointer table; it was never freed before
  CUDA_CHECKED_CALL(cudaFree(data));
}
Loading

0 comments on commit 7aa00b9

Please sign in to comment.