aboutsummaryrefslogtreecommitdiff
path: root/nerv/lib/matrix/generic/cukernel.cu
diff options
context:
space:
mode:
author txh18 <cloudygooseg@gmail.com> 2015-10-28 16:29:29 +0800
committer txh18 <cloudygooseg@gmail.com> 2015-10-28 16:29:29 +0800
commit e0fa1a48cb9f91bfcfc60b732b6f137a7a2071ba (patch)
tree d375f9684970bcfa2977d74074f949bf3f98107a /nerv/lib/matrix/generic/cukernel.cu
parent af99db1c6bc4823cc6ff094f24e963acd4788ef1 (diff)
changed copy_rows_fromd_by_idx a bit to make it clearer
Diffstat (limited to 'nerv/lib/matrix/generic/cukernel.cu')
-rw-r--r-- nerv/lib/matrix/generic/cukernel.cu 8
1 files changed, 4 insertions, 4 deletions
diff --git a/nerv/lib/matrix/generic/cukernel.cu b/nerv/lib/matrix/generic/cukernel.cu
index 6c8e64a..d042d48 100644
--- a/nerv/lib/matrix/generic/cukernel.cu
+++ b/nerv/lib/matrix/generic/cukernel.cu
@@ -294,7 +294,7 @@ __global__ void cudak_(gen_col_idx)(MATRIX_ELEM *b,
}
__global__ void cudak_(copy_rows_by_idx)(const MATRIX_ELEM *a, MATRIX_ELEM *b,
- const MATRIX_ELEM *idx, int b_begin,
+ const MATRIX_ELEM *idx,
int nrow, int ncol, int stride) {
int j = blockIdx.x * blockDim.x + threadIdx.x;
int i = blockIdx.y * blockDim.y + threadIdx.y;
@@ -620,13 +620,13 @@ extern "C" {
}
void cudak_(cuda_copy_rows_by_idx)(const Matrix *a, Matrix *b,
- const Matrix *idx, int b_begin) {
+ const Matrix *idx, int idx_begin) {
dim3 threadsPerBlock(CUDA_THREADS_NN, 1);
dim3 numBlocks(CEIL_DIV(b->ncol, threadsPerBlock.x), b->nrow);
cudak_(copy_rows_by_idx)<<<numBlocks, threadsPerBlock>>> \
(MATRIX_ELEM_PTR(a), MATRIX_ELEM_PTR(b),
- MATRIX_ELEM_PTR(idx) + b_begin,
- b_begin, b->nrow, b->ncol, b->stride / sizeof(MATRIX_ELEM));
+ MATRIX_ELEM_PTR(idx) + idx_begin,
+ b->nrow, b->ncol, b->stride / sizeof(MATRIX_ELEM));
cudaStreamSynchronize(0);
}
}