14 #include "../utils/Float16.cuh" 
   15 #include "../utils/Tensor.cuh" 
   17 namespace faiss { 
namespace gpu {
 
   20 void runSumAlongColumns(Tensor<float, 1, true>& input,
 
   21                         Tensor<float, 2, true>& output,
 
   24 #ifdef FAISS_USE_FLOAT16 
   25 void runSumAlongColumns(Tensor<half, 1, true>& input,
 
   26                         Tensor<half, 2, true>& output,
 
   31 void runAssignAlongColumns(Tensor<float, 1, true>& input,
 
   32                            Tensor<float, 2, true>& output,
 
   35 #ifdef FAISS_USE_FLOAT16 
   36 void runAssignAlongColumns(Tensor<half, 1, true>& input,
 
   37                            Tensor<half, 2, true>& output,
 
   42 void runSumAlongRows(Tensor<float, 1, true>& input,
 
   43                      Tensor<float, 2, true>& output,
 
   46 #ifdef FAISS_USE_FLOAT16 
   47 void runSumAlongRows(Tensor<half, 1, true>& input,
 
   48                      Tensor<half, 2, true>& output,