]> git.uio.no Git - u/mrichter/AliRoot.git/blame - HLT/TPCLib/tracking-ca/AliHLTTPCCAGPUConfig.h
Removing annoying prints
[u/mrichter/AliRoot.git] / HLT / TPCLib / tracking-ca / AliHLTTPCCAGPUConfig.h
CommitLineData
a59a784e 1#ifndef ALIHLTTPCCAGPUCONFIG_H
2#define ALIHLTTPCCAGPUCONFIG_H
3
//GPU Run Configuration
//Block-count multipliers and thread counts, selected at compile time by the
//RADEON, KEPLER, FERMI or __OPENCL__ macros. The #else branch applies when
//none of them is defined.

#ifdef RADEON
#define HLTCA_GPU_BLOCK_COUNT_CONSTRUCTOR_MULTIPLIER 2
#define HLTCA_GPU_BLOCK_COUNT_SELECTOR_MULTIPLIER 3
#define HLTCA_GPU_THREAD_COUNT 256
#define HLTCA_GPU_THREAD_COUNT_CONSTRUCTOR 256
#define HLTCA_GPU_THREAD_COUNT_SELECTOR 256
#define HLTCA_GPU_THREAD_COUNT_FINDER 256
#elif defined(KEPLER)
//Only configuration with a constructor thread count different from 256
#define HLTCA_GPU_BLOCK_COUNT_CONSTRUCTOR_MULTIPLIER 4
#define HLTCA_GPU_BLOCK_COUNT_SELECTOR_MULTIPLIER 3
#define HLTCA_GPU_THREAD_COUNT 256
#define HLTCA_GPU_THREAD_COUNT_CONSTRUCTOR 512
#define HLTCA_GPU_THREAD_COUNT_SELECTOR 256
#define HLTCA_GPU_THREAD_COUNT_FINDER 256
#elif defined(FERMI) || defined(__OPENCL__)
#define HLTCA_GPU_BLOCK_COUNT_CONSTRUCTOR_MULTIPLIER 2
#define HLTCA_GPU_BLOCK_COUNT_SELECTOR_MULTIPLIER 3
#define HLTCA_GPU_THREAD_COUNT 256
#define HLTCA_GPU_THREAD_COUNT_CONSTRUCTOR 256
#define HLTCA_GPU_THREAD_COUNT_SELECTOR 256
#define HLTCA_GPU_THREAD_COUNT_FINDER 256
#else
//Fallback: both block-count multipliers are 1
#define HLTCA_GPU_BLOCK_COUNT_CONSTRUCTOR_MULTIPLIER 1
#define HLTCA_GPU_BLOCK_COUNT_SELECTOR_MULTIPLIER 1
#define HLTCA_GPU_THREAD_COUNT 256
#define HLTCA_GPU_THREAD_COUNT_CONSTRUCTOR 256
#define HLTCA_GPU_THREAD_COUNT_SELECTOR 256
#define HLTCA_GPU_THREAD_COUNT_FINDER 256
#endif
a59a784e 35
#define HLTCA_GPU_DEFAULT_HELPER_THREADS 2 //Number of helper threads to speed up initialization/output

//GPU Parameters
#define HLTCA_GPU_WARP_SIZE 32
#define HLTCA_GPU_REGS 64

//The GPU merger is only switched on when HLTCA_STANDALONE is defined
#ifdef HLTCA_STANDALONE
#define HLTCA_GPU_MERGER //Use GPU Merger
#endif
2fba026d 45
//Detector Parameters
#define HLTCA_ROW_COUNT 159

#define HLTCA_GPU_ROWALIGNMENT uint4 //Type that Row Hits and Grid are aligned to
#define HLTCA_GPU_ROWCOPY int //Type used for row copies, must not be bigger than the row alignment type!!!
b22af1bf 51
#define HLTCA_GPU_SCHED_ROW_STEP 32 //Number of rows to process in one step before rescheduling
#define HLTCA_GPU_SCHED_FIXED_START //Assign each GPU thread a fixed start tracklet instead of using the scheduler to obtain one
//#define HLTCA_GPU_SCHED_FIXED_SLICE //Make each Multiprocessor on the GPU work only on a single slice during tracklet construction
#define HLTCA_GPU_RESCHED //Use dynamic tracklet scheduling

#define HLTCA_GPU_ALTERNATIVE_SCHEDULER //Use alternative scheduling algorithm (makes the 4 options above obsolete)
#define HLTCA_GPU_ALTSCHED_STEPSIZE 80 //Number of rows to process between two rescheduling steps
#define HLTCA_GPU_ALTSCHED_MIN_THREADS 64 //Reschedule if fewer than n threads are active
#define HLTCA_GPU_ALTERNATIVE_SCHEDULER_SIMPLE //Use simple version of alternative scheduler
61
//Texture fetch is only enabled when none of FERMI, KEPLER and __OPENCL__ is defined
#if !defined(FERMI) && !defined(KEPLER) && !defined(__OPENCL__)
#define HLTCA_GPU_TEXTURE_FETCH //Fetch data through texture cache
#define HLTCA_GPU_TEXTURE_FETCHa //Fetch also in Neighbours Finder
#endif
b22af1bf 66
//Profiling and debug output switches (the profiling ones are disabled by default)
//#define HLTCA_GPU_TRACKLET_CONSTRUCTOR_DO_PROFILE //Output Profiling Data for Tracklet Constructor Tracklet Scheduling
//#define HLTCA_GPU_TIME_PROFILE //Output Time Profiling Data for asynchronous DMA transfer
#define BITWISE_COMPATIBLE_DEBUG_OUTPUT //Make Debug Output of CPU and GPU bitwise compatible for comparison, also enable SORT_DUMPDATA!
#define HLTCA_GPU_SORT_DUMPDATA //Sort Start Hits etc before dumping to file
b22af1bf 71
#define HLTCA_GPU_TRACKLET_SELECTOR_HITS_REG_SIZE 12
#define HLTCA_GPU_TRACKLET_SELECTOR_SLICE_COUNT 3 //Currently must be smaller than the number of available MultiProcessors on the GPU, otherwise results will be wrong

#define HLTCA_GPU_MAX_TRACKLETS 12288 //Max number of Tracklets that can be processed by GPU Tracker, should be divisible by 16 at least
#define HLTCA_GPU_MAX_TRACKS 1536 //Max number of Tracks that can be processed by GPU Tracker

//#define HLTCA_GPU_EMULATION_SINGLE_TRACKLET 1313 //Run Tracklet constructor on one single Tracklet in Device Emulation Mode
//#define HLTCA_GPU_EMULATION_DEBUG_TRACKLET 1313

//#define HLTCA_GPU_DEFAULT_MAX_SLICE_COUNT 12
1e63725a 82
#define HLTCA_GPU_TRACKER_CONSTANT_MEM 65000 //Amount of Constant Memory to reserve

//Memory reservation sizes. The products are parenthesized so that each macro
//expands to a single operand and stays correct next to /, % or a cast.
#define HLTCA_GPU_TRACKER_OBJECT_MEMORY (1024 * 1024) //Total amount of Memory to reserve for GPU Tracker Objects
#define HLTCA_GPU_ROWS_MEMORY (1024 * 1024) //Total amount of Memory to reserve for GPU Row Parameters
#define HLTCA_GPU_COMMON_MEMORY (1024 * 1024) //Total amount of Memory to reserve for the common memory struct on GPU
#define HLTCA_GPU_SLICE_DATA_MEMORY (6 * 1024 * 1024) //Amount of Slice Data Memory to reserve per Slice on GPU
#define HLTCA_GPU_GLOBAL_MEMORY (13 * 1024 * 1024) //Amount of global temporary Memory to reserve per Slice on GPU
#define HLTCA_GPU_TRACKS_MEMORY (2 * 1024 * 1024) //Amount of Memory to reserve for Final Tracks per Slice on Host as Page Locked Memory
b22af1bf 91
//Make sure options do not interfere

#ifndef HLTCA_GPUCODE
//No texture fetch for CPU Tracker
//(#undef of a name that is not defined is a no-op, so no #ifdef guard is needed)
#undef HLTCA_GPU_TEXTURE_FETCH
#undef HLTCA_GPU_TEXTURE_FETCHa

//Do not cache Row Hits during Tracklet selection in Registers for CPU Tracker
#undef HLTCA_GPU_TRACKLET_SELECTOR_HITS_REG_SIZE
#define HLTCA_GPU_TRACKLET_SELECTOR_HITS_REG_SIZE 0
#else
//Sort start hits for GPU tracker
#define HLTCA_GPU_SORT_STARTHITS
#endif
110
//Error Codes for GPU Tracker
//Consecutive values starting at 0, where 0 means no error
#define HLTCA_GPU_ERROR_NONE 0
#define HLTCA_GPU_ERROR_ROWBLOCK_TRACKLET_OVERFLOW 1
#define HLTCA_GPU_ERROR_TRACKLET_OVERFLOW 2
#define HLTCA_GPU_ERROR_TRACK_OVERFLOW 3
#define HLTCA_GPU_ERROR_SCHEDULE_COLLISION 4
#define HLTCA_GPU_ERROR_WRONG_ROW 5
a59a784e 118
119#endif
b22af1bf 120