@@ -151,7 +151,7 @@ typedef struct redux_ctx redux_ctx;
151151struct GpuReductionAttr {
152152 gpucontext * gpuCtx ;
153153 unsigned numProcs ;
154- size_t maxLg , maxL0 , maxGg , maxG0 , maxLM ;
154+ size_t maxL0 , maxG0 , maxLM ;
155155
156156 ga_reduce_op op ;
157157 int maxSrcDims ;
@@ -491,9 +491,7 @@ GPUARRAY_PUBLIC int GpuReductionAttr_new (GpuReductionAttr**
491491
492492 (* grAttr )-> gpuCtx = gpuCtx ;
493493 if (gpucontext_property (gpuCtx , GA_CTX_PROP_NUMPROCS , & (* grAttr )-> numProcs ) != GA_NO_ERROR ||
494- gpucontext_property (gpuCtx , GA_CTX_PROP_MAXLSIZE , & (* grAttr )-> maxLg ) != GA_NO_ERROR ||
495494 gpucontext_property (gpuCtx , GA_CTX_PROP_MAXLSIZE0 , & (* grAttr )-> maxL0 ) != GA_NO_ERROR ||
496- gpucontext_property (gpuCtx , GA_CTX_PROP_MAXGSIZE , & (* grAttr )-> maxGg ) != GA_NO_ERROR ||
497495 gpucontext_property (gpuCtx , GA_CTX_PROP_MAXGSIZE0 , & (* grAttr )-> maxG0 ) != GA_NO_ERROR ||
498496 gpucontext_property (gpuCtx , GA_CTX_PROP_LMEMSIZE , & (* grAttr )-> maxLM ) != GA_NO_ERROR ){
499497 free (* grAttr );
@@ -1606,7 +1604,6 @@ static int reduxGenInferProperties (GpuReduction* gr){
16061604
16071605static void reduxGenSetMaxBS (GpuReduction * gr ){
16081606 gr -> maxBS = gr -> grAttr .maxLM /reduxGenGetReduxStateSize (gr );
1609- gr -> maxBS = gr -> maxBS < gr -> grAttr .maxLg ? gr -> maxBS : gr -> grAttr .maxLg ;
16101607 gr -> maxBS = gr -> maxBS < gr -> grAttr .maxL0 ? gr -> maxBS : gr -> grAttr .maxL0 ;
16111608
16121609 /**
@@ -2856,7 +2853,6 @@ static int reduxGenSrcAxisIsSplit (GpuReduction* gr,
28562853static int reduxGenCompile (GpuReduction * gr ){
28572854 int ret , flags = 0 ;
28582855
2859- flags |= GA_USE_CLUDA ;
28602856 if (gr -> TS0tc == GA_HALF || gr -> TD0tc == GA_HALF ){
28612857 flags |= GA_USE_HALF |GA_USE_SMALL ;
28622858 }
@@ -3104,7 +3100,7 @@ static size_t reduxGenEstimateParallelism (const GpuReduction* gr){
31043100 */
31053101
31063102 size_t marginFactor = 16 ;
3107- return marginFactor * gr -> grAttr .numProcs * gr -> grAttr .maxLg ;
3103+ return marginFactor * gr -> grAttr .numProcs * gr -> grAttr .maxL0 ;
31083104}
31093105
31103106/**
0 commit comments