aboutsummaryrefslogblamecommitdiff
path: root/matrix/generic/cukernel.cu
blob: fdab356631379b65e6e30389da035e88511f928f (plain) (tree)
1
2
3
4
5
6
7
8
9




                            
                  
                         
                                                             
                                              




                                                                       
                    

                                       


                                    












                                                                            









                                                                     











                                                                     










                                                                           
                                                                     


                                                                                 













                                                                           

















                                                                           



















                                                                                       
                                                                             


















                                                                              
                                                                     


                                                                                 








                                                                           


                                                              






                                                                   

































                                                                                     







                                                                              







                                                                         































                                                                           
 








                                                                        







                                                                     

                        
                                                            
                                                             








                                                                
                                                             







                                                                
                                                           
                                                             






                                                                      

                                                                      
                                                             








                                                               
                                                          






                                                                                      
                                                                                     





                                                                           
                                                                                     





                                                                           





















                                                                                      


                                                          
                                                     

















                                                                                      

                                                                       
                                                             


















                                                                                          

                                                              






                                                                           

                                                              





                                                                           
                                                          






                                                                                      
                                                                                     





                                                                           
                                                                                     




                                                                           
 




























                                                                                                 

                                                                        
                                                             





                                                                      

                                                   
                                                             





                                                            































                                                                           









                                                                

      
#ifdef NERV_GENERIC_CUKERNEL
#include <assert.h>
#include <stdio.h>
#include "matrix.h"
#include "cuda.h"
#include "float.h"
/* Base thread-count constant.
 * NOTE(review): presumably the per-dimension size of a square thread block;
 * the launch code is not visible here -- TODO confirm. */
#define CUDA_THREADS_N 16
/* CUDA_THREADS_N squared (256 with the value above). */
#define CUDA_THREADS_NN ((CUDA_THREADS_N) * (CUDA_THREADS_N))
/* Integer ceiling division: for non-negative a and positive b, yields the
 * smallest integer that is >= a / b.
 * The expansion evaluates b twice, so do not pass arguments with side
 * effects; (a) + (b) - 1 may overflow for values near the type's maximum. */
#define CEIL_DIV(a, b) (((a) + (b) - 1) / (b))
__global__ void cudak_(