docs/cppapi/Vector_8h_source.html

//

//  Copyright (C) 2004-2008 Greg Landrum and Rational Discovery LLC

//

//   @@ All Rights Reserved @@

//  This file is part of the RDKit.

//  The contents are covered by the terms of the BSD license

//  which is included in the file license.txt, found at the root

//  of the RDKit source tree.

//

#include <RDGeneral/export.h>

#ifndef __RD_VECTOR_H__

#define __RD_VECTOR_H__


#include <RDGeneral/Invariant.h>
#include <RDGeneral/utils.h>

#include <cmath>
#include <cstdlib>
#include <cstring>
#include <ctime>
#include <iomanip>
#include <iostream>
#include <stdexcept>

#include <boost/random.hpp>
#include <boost/smart_ptr.hpp>


//! Threshold below which an L2 norm is treated as zero:
//! RDNumeric::Vector::normalize() throws instead of dividing when the
//! vector's L2 norm is smaller than this value.
static constexpr double zero_tolerance = 1.e-16;


namespace RDNumeric {


//! A class to represent vectors of numbers.

template <class TYPE>


class Vector {

 public:

  typedef boost::shared_array<TYPE> DATA_SPTR;


  //! Initialize with only a size.


  explicit Vector(unsigned int N) {

    d_size = N;

    TYPE *data = new TYPE[N];

    memset(static_cast<void *>(data), 0, d_size * sizeof(TYPE));

    d_data.reset(data);

  }


  //! Initialize with a size and default value.


  Vector(unsigned int N, TYPE val) {  //: Vector(N) {

    d_size = N;

    TYPE *data = new TYPE[N];


    unsigned int i;

    for (i = 0; i < N; i++) {

      data[i] = val;

    }

    d_data.reset(data);

  }


  //! Initialize from a smart pointer.

  /*!

    <b>NOTE:</b> the data is not copied in this case

  */


  Vector(unsigned int N, DATA_SPTR data) {  // TYPE *data) {

    d_size = N;

    d_data = data;

  }


  //! copy constructor

  /*! We make a copy of the other vector's data.

   */


  Vector(const Vector &other) {

    d_size = other.size();

    const TYPE *otherData = other.getData();

    TYPE *data = new TYPE[d_size];


    memcpy(static_cast<void *>(data), static_cast<const void *>(otherData),

           d_size * sizeof(TYPE));

    d_data.reset(data);

  }


  ~Vector() = default;


  //! return the size (dimension) of the vector

  unsigned int size() const { return d_size; }


  //! returns the value at a particular index


  inline TYPE getVal(unsigned int i) const {

    PRECONDITION(i < d_size, "bad index");

    return d_data[i];

  }


  //! sets the index at a particular value


  inline void setVal(unsigned int i, TYPE val) {

    PRECONDITION(i < d_size, "bad index");

    d_data[i] = val;

  }


  inline TYPE operator[](unsigned int i) const {

    PRECONDITION(i < d_size, "bad index");

    return d_data[i];

  }


  inline TYPE &operator[](unsigned int i) {

    PRECONDITION(i < d_size, "bad index");

    return d_data[i];

  }


  //! returns a pointer to our data array

  inline TYPE *getData() { return d_data.get(); }


  //! returns a const pointer to our data array


  inline const TYPE *getData() const {

    // return dp_data;

    return d_data.get();

  }


  //! Copy operator.

  /*! We make a copy of the other Vector's data.

   */


  Vector<TYPE> &assign(const Vector<TYPE> &other) {

    PRECONDITION(d_size == other.size(), "Size mismatch in vector copying");

    const TYPE *otherData = other.getData();

    memcpy(static_cast<void *>(d_data.get()),

           static_cast<const void *>(otherData), d_size * sizeof(TYPE));

    return *this;

  }


  //! elementwise addition, vectors must be the same size.


  Vector<TYPE> &operator+=(const Vector<TYPE> &other) {

    PRECONDITION(d_size == other.size(), "Size mismatch in vector addition");

    const TYPE *otherData = other.getData();

    TYPE *data = d_data.get();

    unsigned int i;

    for (i = 0; i < d_size; i++) {

      data[i] += otherData[i];

    }

    return *this;

  }


  //! elementwise subtraction, vectors must be the same size.


  Vector<TYPE> &operator-=(const Vector<TYPE> &other) {

    PRECONDITION(d_size == other.size(), "Size mismatch in vector subtraction");

    const TYPE *otherData = other.getData();

    TYPE *data = d_data.get();

    unsigned int i;

    for (i = 0; i < d_size; i++) {

      data[i] -= otherData[i];

    }

    return *this;

  }


  //! multiplication by a scalar


  Vector<TYPE> &operator*=(TYPE scale) {

    unsigned int i;

    for (i = 0; i < d_size; i++) {

      d_data[i] *= scale;

    }

    return *this;

  }


  //! division by a scalar


  Vector<TYPE> &operator/=(TYPE scale) {

    unsigned int i;

    for (i = 0; i < d_size; i++) {

      d_data[i] /= scale;

    }

    return *this;

  }


  //! L2 norm squared


  inline TYPE normL2Sq() const {

    TYPE res = (TYPE)0.0;

    unsigned int i;

    TYPE *data = d_data.get();

    for (i = 0; i < d_size; i++) {

      res += data[i] * data[i];

    }

    return res;

  }


  //! L2 norm

  inline TYPE normL2() const { return sqrt(this->normL2Sq()); }


  //! L1 norm


  inline TYPE normL1() const {

    TYPE res = (TYPE)0.0;

    unsigned int i;

    TYPE *data = d_data.get();

    for (i = 0; i < d_size; i++) {

      res += fabs(data[i]);

    }

    return res;

  }


  //! L-infinity norm


  inline TYPE normLinfinity() const {

    TYPE res = (TYPE)(-1.0);

    unsigned int i;

    TYPE *data = d_data.get();

    for (i = 0; i < d_size; i++) {

      if (fabs(data[i]) > res) {

        res = fabs(data[i]);

      }

    }

    return res;

  }


  //! \brief Gets the ID of the entry that has the largest absolute value

  //! i.e. the entry being used for the L-infinity norm


  inline unsigned int largestAbsValId() const {

    TYPE res = (TYPE)(-1.0);

    unsigned int i, id = d_size;

    TYPE *data = d_data.get();

    for (i = 0; i < d_size; i++) {

      if (fabs(data[i]) > res) {

        res = fabs(data[i]);

        id = i;

      }

    }

    return id;

  }


  //! \brief Gets the ID of the entry that has the largest value


  inline unsigned int largestValId() const {

    TYPE res = (TYPE)(-1.e8);

    unsigned int i, id = d_size;

    TYPE *data = d_data.get();

    for (i = 0; i < d_size; i++) {

      if (data[i] > res) {

        res = data[i];

        id = i;

      }

    }

    return id;

  }


  //! \brief Gets the ID of the entry that has the smallest value


  inline unsigned int smallestValId() const {

    TYPE res = (TYPE)(1.e8);

    unsigned int i, id = d_size;

    TYPE *data = d_data.get();

    for (i = 0; i < d_size; i++) {

      if (data[i] < res) {

        res = data[i];

        id = i;

      }

    }

    return id;

  }


  //! returns the dot product between two Vectors


  inline TYPE dotProduct(const Vector<TYPE> other) const {

    PRECONDITION(d_size == other.size(),

                 "Size mismatch in vector doct product");

    const TYPE *oData = other.getData();

    unsigned int i;

    TYPE res = (TYPE)(0.0);

    TYPE *data = d_data.get();

    for (i = 0; i < d_size; i++) {

      res += (data[i] * oData[i]);

    }

    return res;

  }


  //! Normalize the vector using the L2 norm


  inline void normalize() {

    TYPE val = this->normL2();

    if (val < zero_tolerance) {

      throw std::runtime_error("Cannot normalize a zero length vector");

    }

    (*this) /= val;

  }


  //! Set to a random unit vector


  inline void setToRandom(unsigned int seed = 0) {

    // we want to get our own RNG here instead of using the global

    // one.  This is related to Issue285.

    RDKit::rng_type generator(42u);

    RDKit::uniform_double dist(0, 1.0);

    RDKit::double_source_type randSource(generator, dist);

    if (seed > 0) {

      generator.seed(seed);

    } else {

      // we can't initialize using only clock(), because it's possible

      // that we'll get here fast enough that clock() will return 0

      // and generator.seed(0) is an error:

      generator.seed(clock() + 1);

    }


    unsigned int i;

    TYPE *data = d_data.get();

    for (i = 0; i < d_size; i++) {

      data[i] = randSource();

    }

    this->normalize();

  }


 private:

  unsigned int d_size;  //!< our length

  DATA_SPTR d_data;

  Vector<TYPE> &operator=(const Vector<TYPE> &other);

};


typedef Vector<double> DoubleVector;


//! returns the algebraic tanimoto similarity [defn' from JCIM 46:587-96 (2006)]
/*!
  Computed as  (v1 . v2) / (|v1|^2 + |v2|^2 - v1 . v2).
  The result is 0.0 when the dot product is exactly zero or when the
  denominator is exactly zero.
*/
template <typename T>
double TanimotoSimilarity(const Vector<T> &v1, const Vector<T> &v2) {
  const double overlap = v1.dotProduct(v2);
  if (overlap == 0.0) {
    return 0.0;
  }
  const double denominator = v1.normL2Sq() + v2.normL2Sq() - overlap;
  return (denominator == 0.0) ? 0.0 : overlap / denominator;
}


}  // end of namespace RDNumeric


//! ostream operator for Vectors
/*!
  Writes "Size: N [" followed by every element (field width 7,
  precision 3, each followed by ", ") and a closing "]" plus newline.
*/
template <typename TYPE>
std::ostream &operator<<(std::ostream &target,
                         const RDNumeric::Vector<TYPE> &vec) {
  const unsigned int nEntries = vec.size();
  target << "Size: " << nEntries << " [";
  for (unsigned int idx = 0; idx != nEntries; ++idx) {
    target << std::setw(7) << std::setprecision(3) << vec.getVal(idx) << ", ";
  }
  target << "]\n";
  return target;
}


#endif

Invariant.h

PRECONDITION
#define PRECONDITION(expr, mess)
Definition Invariant.h:109

zero_tolerance
static constexpr double zero_tolerance
Definition Vector.h:25

operator<<
std::ostream & operator<<(std::ostream &target, const RDNumeric::Vector< TYPE > &vec)
ostream operator for Vectors
Definition Vector.h:320

RDNumeric::Vector
A class to represent vectors of numbers.
Definition Vector.h:31

RDNumeric::Vector::normL2
TYPE normL2() const
L2 norm.
Definition Vector.h:179

RDNumeric::Vector::operator*=
Vector< TYPE > & operator*=(TYPE scale)
multiplication by a scalar
Definition Vector.h:150

RDNumeric::Vector::Vector
Vector(unsigned int N)
Initialize with only a size.
Definition Vector.h:36

RDNumeric::Vector::Vector
Vector(const Vector &other)
copy constructor
Definition Vector.h:67

RDNumeric::Vector::assign
Vector< TYPE > & assign(const Vector< TYPE > &other)
Copy operator.
Definition Vector.h:117

RDNumeric::Vector::operator[]
TYPE & operator[](unsigned int i)
Definition Vector.h:99

RDNumeric::Vector::normalize
void normalize()
Normalize the vector using the L2 norm.
Definition Vector.h:263

RDNumeric::Vector::setVal
void setVal(unsigned int i, TYPE val)
sets the value at a particular index
Definition Vector.h:89

RDNumeric::Vector::Vector
Vector(unsigned int N, TYPE val)
Initialize with a size and default value.
Definition Vector.h:44

RDNumeric::Vector::operator-=
Vector< TYPE > & operator-=(const Vector< TYPE > &other)
elementwise subtraction, vectors must be the same size.
Definition Vector.h:138

RDNumeric::Vector::operator+=
Vector< TYPE > & operator+=(const Vector< TYPE > &other)
elementwise addition, vectors must be the same size.
Definition Vector.h:126

RDNumeric::Vector::setToRandom
void setToRandom(unsigned int seed=0)
Set to a random unit vector.
Definition Vector.h:272

RDNumeric::Vector::size
unsigned int size() const
return the size (dimension) of the vector
Definition Vector.h:80

RDNumeric::Vector::normL1
TYPE normL1() const
L1 norm.
Definition Vector.h:182

RDNumeric::Vector::operator/=
Vector< TYPE > & operator/=(TYPE scale)
division by a scalar
Definition Vector.h:159

RDNumeric::Vector::~Vector
~Vector()=default

RDNumeric::Vector::normLinfinity
TYPE normLinfinity() const
L-infinity norm.
Definition Vector.h:193

RDNumeric::Vector::DATA_SPTR
boost::shared_array< TYPE > DATA_SPTR
Definition Vector.h:33

RDNumeric::Vector::normL2Sq
TYPE normL2Sq() const
L2 norm squared.
Definition Vector.h:168

RDNumeric::Vector::dotProduct
TYPE dotProduct(const Vector< TYPE > other) const
returns the dot product between two Vectors
Definition Vector.h:249

RDNumeric::Vector::largestValId
unsigned int largestValId() const
Gets the ID of the entry that has the largest value.
Definition Vector.h:221

RDNumeric::Vector::largestAbsValId
unsigned int largestAbsValId() const
Gets the ID of the entry that has the largest absolute value i.e. the entry being used for the L-infi...
Definition Vector.h:207

RDNumeric::Vector::getData
TYPE * getData()
returns a pointer to our data array
Definition Vector.h:105

RDNumeric::Vector::smallestValId
unsigned int smallestValId() const
Gets the ID of the entry that has the smallest value.
Definition Vector.h:235

RDNumeric::Vector::getVal
TYPE getVal(unsigned int i) const
returns the value at a particular index
Definition Vector.h:83

RDNumeric::Vector::getData
const TYPE * getData() const
returns a const pointer to our data array
Definition Vector.h:108

RDNumeric::Vector::operator[]
TYPE operator[](unsigned int i) const
Definition Vector.h:94

RDNumeric::Vector::Vector
Vector(unsigned int N, DATA_SPTR data)
Initialize from a smart pointer.
Definition Vector.h:59

export.h

RDKit::rng_type
boost::minstd_rand rng_type
Definition utils.h:36

RDKit::double_source_type
boost::variate_generator< rng_type &, uniform_double > double_source_type
Definition utils.h:40

RDKit::uniform_double
boost::uniform_real uniform_double
Definition utils.h:38

RDNumeric
Definition AlignPoints.h:18

RDNumeric::TanimotoSimilarity
double TanimotoSimilarity(const Vector< T > &v1, const Vector< T > &v2)
returns the algebraic tanimoto similarity [defn' from JCIM 46:587-96 (2006)]
Definition Vector.h:305

RDNumeric::DoubleVector
Vector< double > DoubleVector
Definition Vector.h:301

utils.h