/**
 * Copyright (c) Facebook, Inc. and its affiliates.
 *
 * This source code is licensed under the MIT license found in the
 * LICENSE file in the root directory of this source tree.
 */

#pragma once

#include <faiss/MetricType.h>
#include <faiss/gpu/GpuResources.h>
#include <faiss/gpu/utils/DeviceTensor.cuh>
#include <faiss/gpu/utils/DeviceVector.cuh>

namespace faiss {
namespace gpu {

class GpuResources;

/// Holder of GPU resources for a particular flat index
class FlatIndex {
   public:
    FlatIndex(
            GpuResources* res,
            int dim,
            bool useFloat16,
            bool storeTransposed,
            MemorySpace space);
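    // Example (a sketch; assumes a StandardGpuResources instance named
    // `provider` and 128-dimensional vectors kept as float32 in ordinary
    // device memory):
    //   FlatIndex index(
    //           provider.getResources().get(),
    //           128,
    //           false,
    //           false,
    //           MemorySpace::Device);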

    /// Whether or not this flat index primarily stores data in float16
    bool getUseFloat16() const;

    /// Returns the number of vectors we contain
    int getSize() const;

    /// Returns the dimensionality of the vectors
    int getDim() const;

    /// Reserve storage that can contain at least this many vectors
    void reserve(size_t numVecs, cudaStream_t stream);
    /// Returns a reference to our vectors in the requested type; the FlatIndex
    /// must store that type (float16 or float32), otherwise this asserts
    template <typename T>
    Tensor<T, 2, true>& getVectorsRef();
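    // Example (a sketch; `index` is assumed to have been constructed with
    // useFloat16 = false, so the float32 instantiation is the valid one):
    //   Tensor<float, 2, true>& vecs = index.getVectorsRef<float>();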

    /// Returns a reference to our vectors currently in use
    Tensor<float, 2, true>& getVectorsFloat32Ref();

    /// Returns a reference to our vectors currently in use (useFloat16 mode)
    Tensor<half, 2, true>& getVectorsFloat16Ref();

    /// Performs a copy of the vectors on the given device, converting
    /// as needed from float16
    DeviceTensor<float, 2, true> getVectorsFloat32Copy(cudaStream_t stream);
    /// Returns a copy of only a subset of the vectors, namely
    /// [from, from + num), converting as needed from float16
    DeviceTensor<float, 2, true> getVectorsFloat32Copy(
            int from,
            int num,
            cudaStream_t stream);
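    // Example (a sketch; copies the 8 stored vectors starting at index 16 as
    // float32; `stream` is the CUDA stream to run the copy on):
    //   DeviceTensor<float, 2, true> chunk =
    //           index.getVectorsFloat32Copy(16, 8, stream);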

    /// For each query vector, finds the k nearest stored vectors under the
    /// given metric, writing the resulting distances and indices of the
    /// stored vectors to the output tensors
    void query(
            Tensor<float, 2, true>& vecs,
            int k,
            faiss::MetricType metric,
            float metricArg,
            Tensor<float, 2, true>& outDistances,
            Tensor<int, 2, true>& outIndices,
            bool exactDistance);

    /// Same, but for half-precision (float16) query vectors
    void query(
            Tensor<half, 2, true>& vecs,
            int k,
            faiss::MetricType metric,
            float metricArg,
            Tensor<float, 2, true>& outDistances,
            Tensor<int, 2, true>& outIndices,
            bool exactDistance);
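    // Example (a sketch; `queries` [numQueries x dim], `distances`
    // [numQueries x 10] and `labels` [numQueries x 10] are assumed to be
    // pre-allocated device tensors):
    //   index.query(queries, 10, faiss::METRIC_L2, 0, distances, labels, true);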

    /// Compute the residual of each given vector with respect to the stored
    /// vector selected by the corresponding entry of listIds
    void computeResidual(
            Tensor<float, 2, true>& vecs,
            Tensor<int, 1, true>& listIds,
            Tensor<float, 2, true>& residuals);
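    // Example (a sketch; `queries`, `assignedIds` and `residuals` are assumed
    // to be pre-allocated device tensors, with residuals[i] receiving
    // queries[i] minus the stored vector at assignedIds[i]):
    //   index.computeResidual(queries, assignedIds, residuals);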

    /// Gather stored vectors given a set of IDs
    void reconstruct(
            Tensor<int, 1, true>& listIds,
            Tensor<float, 2, true>& vecs);

    /// Gather stored vectors given a 2-d table of IDs
    void reconstruct(
            Tensor<int, 2, true>& listIds,
            Tensor<float, 3, true>& vecs);
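    // Example (a sketch; gathers the stored vectors at `ids` [n] into `out`
    // [n x dim], both assumed to be pre-allocated device tensors):
    //   index.reconstruct(ids, out);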

    /// Add vectors to ourselves; the pointer passed can be on the host
    /// or the device
    void add(const float* data, int numVecs, cudaStream_t stream);
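    // Example (a sketch; `data` points to numVecs * dim contiguous float32
    // values on either the host or the device, and `stream` is the CUDA
    // stream to run the copy on):
    //   index.add(data, numVecs, stream);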

    /// Free all storage
    void reset();

   private:
    /// Collection of GPU resources that we use
    GpuResources* resources_;

    /// Dimensionality of our vectors
    const int dim_;
    /// Whether the vectors are stored as float16
    const bool useFloat16_;

    /// Store vectors in transposed layout for speed; makes addition to
    /// the index slower
    const bool storeTransposed_;

    /// Memory space for our allocations
    MemorySpace space_;

    /// How many vectors we have
    int num_;

    /// The underlying expandable storage
    DeviceVector<char> rawData_;

    /// Vectors currently in rawData_
    DeviceTensor<float, 2, true> vectors_;
    DeviceTensor<float, 2, true> vectorsTransposed_;

    /// Vectors currently in rawData_, float16 form
    DeviceTensor<half, 2, true> vectorsHalf_;
    DeviceTensor<half, 2, true> vectorsHalfTransposed_;

    /// Precomputed L2 norms
    DeviceTensor<float, 1, true> norms_;
};

} // namespace gpu
} // namespace faiss