mirror of
https://github.com/pjreddie/darknet.git
synced 2023-08-10 21:13:14 +03:00
Replace deprecated cudaThreadSynchronize() with cudaDeviceSynchronize()
This commit is contained in:
parent
61c9d02ec4
commit
9b7afaca07
@@ -229,7 +229,7 @@ void time_gpu(int TA, int TB, int m, int k, int n)
|
|||||||
clock_t start = clock(), end;
|
clock_t start = clock(), end;
|
||||||
for(i = 0; i<iter; ++i){
|
for(i = 0; i<iter; ++i){
|
||||||
gemm_gpu(TA,TB,m,n,k,1,a_cl,lda,b_cl,ldb,1,c_cl,n);
|
gemm_gpu(TA,TB,m,n,k,1,a_cl,lda,b_cl,ldb,1,c_cl,n);
|
||||||
cudaThreadSynchronize();
|
cudaDeviceSynchronize();
|
||||||
}
|
}
|
||||||
double flop = ((double)m)*n*(2.*k + 2.)*iter;
|
double flop = ((double)m)*n*(2.*k + 2.)*iter;
|
||||||
double gflop = flop/pow(10., 9);
|
double gflop = flop/pow(10., 9);
|
||||||
|
Loading…
Reference in New Issue
Block a user