Changed default config to enable NJIT & GPU for 50 iterations

This commit is contained in:
saundersp 2023-07-15 03:36:52 +02:00
parent 18afd40782
commit e40bbb999f
2 changed files with 7 additions and 8 deletions

View File

@ -6,14 +6,12 @@
#ifdef __CUDACC__ #ifdef __CUDACC__
#define NB_THREADS 1024 #define NB_THREADS 1024
#define NB_THREADS_2D_X 32 #define NB_THREADS_2D_X 32
#define NB_THREADS_2D_Y 32 #define NB_THREADS_2D_Y 32
__device__ constexpr const size_t M = 5; //log2(NB_THREADS_2D_Y));
#define NB_THREADS_3D_X 16 #define NB_THREADS_3D_X 16
#define NB_THREADS_3D_Y 16 #define NB_THREADS_3D_Y 16
#define NB_THREADS_3D_Z 4 #define NB_THREADS_3D_Z 4
__device__ constexpr const size_t M = 5; //log2(NB_THREADS_2D_Y));
#endif #endif
// Save state to avoid recalculation on restart // Save state to avoid recalculation on restart
@ -25,9 +23,9 @@ __device__ constexpr const size_t M = 5; //log2(NB_THREADS_2D_Y));
// Number of weak classifiers // Number of weak classifiers
// const size_t TS[] = { 1 }; // const size_t TS[] = { 1 };
// const size_t TS[] = { 1, 5, 10 }; // const size_t TS[] = { 1, 5, 10 };
// const size_t TS[] = { 1, 5, 10, 25, 50 }; const size_t TS[] = { 1, 5, 10, 25, 50 };
// const size_t TS[] = { 1, 5, 10, 25, 50, 100, 200, 300 }; // const size_t TS[] = { 1, 5, 10, 25, 50, 100, 200, 300 };
const size_t TS[] = { 1, 5, 10, 25, 50, 100, 200, 300, 400, 500, 1000 }; // const size_t TS[] = { 1, 5, 10, 25, 50, 100, 200, 300, 400, 500, 1000 };
// Enable verbose output (for debugging purposes) // Enable verbose output (for debugging purposes)
#define __DEBUG false #define __DEBUG false

View File

@ -14,16 +14,17 @@ SAVE_STATE = True
# Redo the state even if it's already saved # Redo the state even if it's already saved
FORCE_REDO = False FORCE_REDO = False
# Use NJIT to greatly accelerate runtime # Use NJIT to greatly accelerate runtime
COMPILE_WITH_C = False COMPILE_WITH_C = True
# Use GPU to greatly accelerate runtime (as priority over NJIT) # Use GPU to greatly accelerate runtime (as priority over NJIT)
GPU_BOOSTED = True GPU_BOOSTED = True
# Number of weak classifiers # Number of weak classifiers
# TS = [1] # TS = [1]
# TS = [1, 5, 10] # TS = [1, 5, 10]
# TS = [1, 5, 10, 25, 50] TS = [1, 5, 10, 25, 50]
# TS = [1, 5, 10, 25, 50, 100, 200] # TS = [1, 5, 10, 25, 50, 100, 200]
# TS = [1, 5, 10, 25, 50, 100, 200, 300] # TS = [1, 5, 10, 25, 50, 100, 200, 300]
TS = [1, 5, 10, 25, 50, 100, 200, 300, 400, 500, 1000] # TS = [1, 5, 10, 25, 50, 100, 200, 300, 400, 500, 1000]
# Enable verbose output (for debugging purposes) # Enable verbose output (for debugging purposes)
__DEBUG = False __DEBUG = False
# Debugging options # Debugging options