about | summary | refs | log | tree | commit | diff
path: root/matrix/generic/cumatrix.c
diff options
context:
space:
mode:
Diffstat (limited to 'matrix/generic/cumatrix.c')
-rw-r--r-- matrix/generic/cumatrix.c 15
1 files changed, 8 insertions, 7 deletions
diff --git a/matrix/generic/cumatrix.c b/matrix/generic/cumatrix.c
index 49e2620..2deb7a3 100644
--- a/matrix/generic/cumatrix.c
+++ b/matrix/generic/cumatrix.c
@@ -27,6 +27,7 @@
static cublasHandle_t cublas_handle;
Matrix *nerv_matrix_(new_)(long nrow, long ncol);
+void nerv_matrix_(data_free)(Matrix *self);
static void nerv_matrix_(add_)(const Matrix *a, const Matrix *b,
const Matrix *c,
@@ -98,9 +99,8 @@ static int nerv_matrix_(sigmoid)(lua_State *L) {
Matrix *a = luaT_checkudata(L, 1, nerv_matrix_(tname));
Matrix *b = luaT_checkudata(L, 2, nerv_matrix_(tname));
CHECK_SAME_DIMENSION(a, b);
- cudak_(cuda_sigmoid)(a, b);
- luaT_pushudata(L, b, nerv_matrix_(tname));
- return 1;
+ cudak_(cuda_sigmoid)(b, a);
+ return 0;
}
static int nerv_matrix_(sigmoid_grad)(lua_State *L) {
@@ -114,15 +114,16 @@ static int nerv_matrix_(sigmoid_grad)(lua_State *L) {
}
static int nerv_matrix_(softmax)(lua_State *L) {
- Matrix *a = luaT_checkudata(L, 1, nerv_matrix_(tname));
+ Matrix *a = luaT_checkudata(L, 2, nerv_matrix_(tname));
+ Matrix *b = luaT_checkudata(L, 1, nerv_matrix_(tname));
Matrix *max = nerv_matrix_(new_)(a->nrow, 1);
Matrix *dno = nerv_matrix_(new_)(a->nrow, 1);
- Matrix *b = nerv_matrix_(new_)(a->nrow, a->ncol);
cudak_(cuda_rowmax)(a, max);
cudak_(cuda_softmax_denominator)(a, max, dno);
cudak_(cuda_softmax_final)(a, max, dno, b);
- luaT_pushudata(L, b, nerv_matrix_(tname));
- return 1;
+ nerv_matrix_(data_free)(max);
+ nerv_matrix_(data_free)(dno);
+ return 0;
}
static int nerv_matrix_(rowsum)(lua_State *L) {