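This is an attempted fix for T38679: Cycles GPU Performance Regression.
From my testing, this change (what I should have done in the first place) reduces the regression a lot: the cuEventRecord/cuEventSynchronize calls on tileDone are removed from directly after the cuLaunchGridAsync call and placed just before task->release_tile(tile) instead. Let's hope it is enough; otherwise we will have to go back to busy waiting.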
This commit is contained in:
@@ -654,9 +654,6 @@ public:
|
|||||||
cuda_assert(cuFuncSetBlockShape(cuPathTrace, xthreads, ythreads, 1))
|
cuda_assert(cuFuncSetBlockShape(cuPathTrace, xthreads, ythreads, 1))
|
||||||
cuda_assert(cuLaunchGridAsync(cuPathTrace, xblocks, yblocks, cuStream))
|
cuda_assert(cuLaunchGridAsync(cuPathTrace, xblocks, yblocks, cuStream))
|
||||||
|
|
||||||
cuda_assert(cuEventRecord(tileDone, cuStream ))
|
|
||||||
cuda_assert(cuEventSynchronize(tileDone))
|
|
||||||
|
|
||||||
cuda_pop_context();
|
cuda_pop_context();
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -989,6 +986,8 @@ public:
|
|||||||
|
|
||||||
task->update_progress(tile);
|
task->update_progress(tile);
|
||||||
}
|
}
|
||||||
|
cuda_assert(cuEventRecord(tileDone, cuStream ))
|
||||||
|
cuda_assert(cuEventSynchronize(tileDone))
|
||||||
|
|
||||||
task->release_tile(tile);
|
task->release_tile(tile);
|
||||||
}
|
}
|
||||||
|
Reference in New Issue
Block a user