/** * Copyright (c) Facebook, Inc. and its affiliates. * * This source code is licensed under the MIT license found in the * LICENSE file in the root directory of this source tree. */ #pragma once #include namespace faiss { namespace gpu { // output[x][i] += input[i] for all x void runSumAlongColumns(Tensor& input, Tensor& output, cudaStream_t stream); #ifdef FAISS_USE_FLOAT16 void runSumAlongColumns(Tensor& input, Tensor& output, cudaStream_t stream); #endif // output[x][i] = input[i] for all x void runAssignAlongColumns(Tensor& input, Tensor& output, cudaStream_t stream); #ifdef FAISS_USE_FLOAT16 void runAssignAlongColumns(Tensor& input, Tensor& output, cudaStream_t stream); #endif // output[i][x] += input[i] for all x // If zeroClamp, output[i][x] = max(output[i][x] + input[i], 0) for all x void runSumAlongRows(Tensor& input, Tensor& output, bool zeroClamp, cudaStream_t stream); #ifdef FAISS_USE_FLOAT16 void runSumAlongRows(Tensor& input, Tensor& output, bool zeroClamp, cudaStream_t stream); #endif } } // namespace