]>
Commit | Line | Data |
---|---|---|
a59a784e | 1 | #ifndef ALIHLTTPCCAGPUCONFIG_H |
2 | #define ALIHLTTPCCAGPUCONFIG_H | |
3 | ||
c7d6f78b | 4 | //GPU Run Configuration |
b647b430 | 5 | |
6 | //#define FERMI | |
7 | ||
8 | #ifdef FERMI | |
6f0cdd46 | 9 | #define HLTCA_GPU_BLOCK_COUNT_CONSTRUCTOR_MULTIPLIER 2 |
10 | #define HLTCA_GPU_BLOCK_COUNT_SELECTOR_MULTIPLIER 3 | |
b647b430 | 11 | #define HLTCA_GPU_THREAD_COUNT 256 |
12 | #define HLTCA_GPU_THREAD_COUNT_CONSTRUCTOR 256 | |
13 | #define HLTCA_GPU_THREAD_COUNT_SELECTOR 256 | |
14 | #define HLTCA_GPU_THREAD_COUNT_FINDER 256 | |
15 | #else | |
6f0cdd46 | 16 | #define HLTCA_GPU_BLOCK_COUNT_CONSTRUCTOR_MULTIPLIER 1 |
17 | #define HLTCA_GPU_BLOCK_COUNT_SELECTOR_MULTIPLIER 1 | |
a59a784e | 18 | #define HLTCA_GPU_THREAD_COUNT 256 |
b647b430 | 19 | #define HLTCA_GPU_THREAD_COUNT_CONSTRUCTOR 256 |
20 | #define HLTCA_GPU_THREAD_COUNT_SELECTOR 256 | |
21 | #define HLTCA_GPU_THREAD_COUNT_FINDER 256 | |
22 | #endif | |
a59a784e | 23 | |
e4818148 | 24 | #define HLTCA_GPU_DEFAULT_HELPER_THREADS 2 //Number of helper threads to speed up initialization/output |
2fba026d | 25 | |
c7d6f78b | 26 | //GPU Parameters |
a59a784e | 27 | #define HLTCA_GPU_WARP_SIZE 32 |
28 | #define HLTCA_GPU_REGS 64 | |
c7d6f78b | 29 | |
e01a1f52 | 30 | #ifdef HLTCA_STANDALONE |
31 | #define HLTCA_GPU_MERGER //Use GPU Merger | |
32 | #endif | |
2fba026d | 33 | |
c7d6f78b | 34 | //Detector Parameters |
a59a784e | 35 | #define HLTCA_ROW_COUNT 159 |
36 | ||
c7d6f78b | 37 | #define HLTCA_GPU_ROWALIGNMENT uint4 //Align Row Hits and Grid |
38 | #define HLTCA_GPU_ROWCOPY int //must not be bigger than row alignment!!! | |
b22af1bf | 39 | |
c7d6f78b | 40 | #define HLTCA_GPU_SCHED_ROW_STEP 32 //Amount of Rows to process in one step before rescheduling |
41 | #define HLTCA_GPU_SCHED_FIXED_START //Assign each GPU thread a start tracklet to start with instead of using the scheduler to obtain start tracklet | |
e4818148 | 42 | //#define HLTCA_GPU_SCHED_FIXED_SLICE //Make each Multiprocessor on the GPU work only on a single slice during tracklet construction |
c7d6f78b | 43 | #define HLTCA_GPU_RESCHED //Use dynamic tracklet scheduling |
b22af1bf | 44 | |
2fba026d | 45 | #define HLTCA_GPU_ALTERNATIVE_SCHEDULER //Use alternative scheduling algorithm (makes upper 4 options obsolete) |
e4818148 | 46 | #define HLTCA_GPU_ALTSCHED_STEPSIZE 80 //Number of rows to process between rescheduling steps |
47 | #define HLTCA_GPU_ALTSCHED_MIN_THREADS 32 //Reschedule if less than n threads are active | |
2fba026d | 48 | #define HLTCA_GPU_ALTERNATIVE_SCHEDULER_SIMPLE //Use simple version of alternative scheduler |
49 | ||
b647b430 | 50 | #ifndef FERMI |
6f0cdd46 | 51 | #define HLTCA_GPU_TEXTURE_FETCH //Fetch data through texture cache |
f0bada7f | 52 | #define HLTCA_GPU_TEXTURE_FETCHa //Fetch also in Neighbours Finder |
b647b430 | 53 | #endif |
b22af1bf | 54 | |
c7d6f78b | 55 | //#define HLTCA_GPU_TRACKLET_CONSTRUCTOR_DO_PROFILE //Output Profiling Data for Tracklet Constructor Tracklet Scheduling |
56 | //#define HLTCA_GPU_TIME_PROFILE //Output Time Profiling Data for asynchronous DMA transfer | |
2fba026d | 57 | #define BITWISE_COMPATIBLE_DEBUG_OUTPUT //Make Debug Output of CPU and GPU bitwise compatible for comparison, also enable SORT_DUMPDATA! |
6f0cdd46 | 58 | #define HLTCA_GPU_SORT_DUMPDATA //Sort Start Hits etc before dumping to file |
b22af1bf | 59 | |
60 | #define HLTCA_GPU_TRACKLET_SELECTOR_HITS_REG_SIZE 12 | |
61 | #define HLTCA_GPU_TRACKLET_SELECTOR_SLICE_COUNT 3 //Currently must be smaller than the number of available MultiProcessors on the GPU, otherwise results will be wrong | |
62 | ||
c7d6f78b | 63 | #define HLTCA_GPU_MAX_TRACKLETS 12288 //Max Number of Tracklets that can be processed by GPU Tracker, Should be divisible by 16 at least |
2fba026d | 64 | #define HLTCA_GPU_MAX_TRACKS 1536 //Max number of Tracks that can be processed by GPU Tracker |
b22af1bf | 65 | |
c7d6f78b | 66 | //#define HLTCA_GPU_EMULATION_SINGLE_TRACKLET 1313 //Run Tracklet constructor on a single Tracklet in Device Emulation Mode |
b22af1bf | 67 | //#define HLTCA_GPU_EMULATION_DEBUG_TRACKLET 1313 |
68 | ||
b647b430 | 69 | //#define HLTCA_GPU_DEFAULT_MAX_SLICE_COUNT 12 |
1e63725a | 70 | |
c7d6f78b | 71 | #define HLTCA_GPU_TRACKER_CONSTANT_MEM 65000 //Amount of Constant Memory to reserve |
72 | ||
73 | #define HLTCA_GPU_TRACKER_OBJECT_MEMORY 1024 * 1024 //Total amount of Memory to reserve for GPU Tracker Objects | |
74 | #define HLTCA_GPU_ROWS_MEMORY 1024 * 1024 //Total amount of Memory to reserve for GPU Row Parameters | |
75 | #define HLTCA_GPU_COMMON_MEMORY 1024 * 1024 //Total amount of Memory to reserve for CommonMemoryStruct on GPU | |
2fba026d | 76 | #define HLTCA_GPU_SLICE_DATA_MEMORY 6 * 1024 * 1024 //Amount of Slice Data Memory to reserve per Slice on GPU |
77 | #define HLTCA_GPU_GLOBAL_MEMORY 13 * 1024 * 1024 //Amount of global temporary Memory to reserve per Slice on GPU | |
f0bada7f | 78 | #define HLTCA_GPU_TRACKS_MEMORY 2 * 1024 * 1024 //Amount of Memory to reserve for Final Tracks per Slice on Host as Page Locked Memory |
b22af1bf | 79 | |
c7d6f78b | 80 | //Make sure options do not interfere |
b22af1bf | 81 | |
82 | #ifndef HLTCA_GPUCODE | |
c7d6f78b | 83 | //No texture fetch for CPU Tracker |
b22af1bf | 84 | #ifdef HLTCA_GPU_TEXTURE_FETCH |
85 | #undef HLTCA_GPU_TEXTURE_FETCH | |
86 | #endif | |
f0bada7f | 87 | #ifdef HLTCA_GPU_TEXTURE_FETCHa |
88 | #undef HLTCA_GPU_TEXTURE_FETCHa | |
89 | #endif | |
1e63725a | 90 | |
c7d6f78b | 91 | //Do not cache Row Hits during Tracklet selection in Registers for CPU Tracker |
b22af1bf | 92 | #undef HLTCA_GPU_TRACKLET_SELECTOR_HITS_REG_SIZE |
93 | #define HLTCA_GPU_TRACKLET_SELECTOR_HITS_REG_SIZE 0 | |
b22af1bf | 94 | #else |
c7d6f78b | 95 | //Sort start hits for GPU tracker |
b22af1bf | 96 | #define HLTCA_GPU_SORT_STARTHITS |
97 | #endif | |
98 | ||
c7d6f78b | 99 | //Error Codes for GPU Tracker |
b22af1bf | 100 | #define HLTCA_GPU_ERROR_NONE 0 |
101 | #define HLTCA_GPU_ERROR_ROWBLOCK_TRACKLET_OVERFLOW 1 | |
a59a784e | 102 | #define HLTCA_GPU_ERROR_TRACKLET_OVERFLOW 2 |
103 | #define HLTCA_GPU_ERROR_TRACK_OVERFLOW 3 | |
104 | #define HLTCA_GPU_ERROR_SCHEDULE_COLLISION 4 | |
f0bada7f | 105 | #define HLTCA_GPU_ERROR_WRONG_ROW 5 |
a59a784e | 106 | |
107 | #endif | |
b22af1bf | 108 |