/*
 * Copyright 2009-2019 The VOTCA Development Team (http://www.votca.org)
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *
 */
#pragma once
#ifndef HUFFMANTREE_H
#define HUFFMANTREE_H
#include <cstdlib>
#include <list>
#include <queue>
#include <stdexcept>
#include <vector>

#include <votca/tools/types.h>  // votca::Index

namespace votca {
namespace xtp {

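/*
 * A Huffman tree built over a vector of weighted events, used to pick a
 * hopping destination from a single uniform random number with one comparison
 * per tree level instead of a linear search. T must provide a getValue()
 * method returning the (non-negative) weight of the event.
 *
 * Minimal usage sketch (the Event type and uniform01() call are placeholders,
 * not part of this header):
 *
 *   std::vector<Event> events = ...;   // hopping rates / weights
 *   huffmanTree<Event> tree;
 *   tree.setEvents(&events);           // the tree keeps a pointer, not a copy
 *   tree.makeTree();
 *   Event *chosen = tree.findHoppingDestination(uniform01());
 */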
template <class T>
class huffmanTree {

 public:
  void makeTree() {
    if (!events) {
      throw std::runtime_error(
          "Error in huffmanTree::makeTree : Pointer to Events not set!");
    }

    // comparator for the node queue: the node with the smallest probability is
    // on top
    auto compare = [](huffmanNode<T> *n1, huffmanNode<T> *n2) {
      return n1->probability > n2->probability;
    };

    // priority queues, because the algorithm always needs the element with the
    // smallest probability. Also, nodes keep being added to it, so it would be
    // very inefficient to re-sort it in every iteration.
    std::priority_queue<huffmanNode<T> *, std::vector<huffmanNode<T> *>,
                        decltype(compare)>
        queue(compare);

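    // n events need ceil(n/2) last-level nodes (each holding up to two events)
    // and ceil(n/2) - 1 internal nodes above them: n nodes in total if n is
    // odd, n - 1 if n is even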
    htree = std::vector<huffmanNode<T>>(
        events->size() % 2 ? events->size() : events->size() - 1);

    auto comp2 = [](T *e1, T *e2) { return e1->getValue() > e2->getValue(); };
    std::priority_queue<T *, std::vector<T *>, decltype(comp2)> eventQueue(
        comp2);
    sum_of_values = 0.0;

    Index firstEmptyFieldIndex = 0;
    for (T &e : *events) {
      eventQueue.push(&e);
      sum_of_values += e.getValue();
    }
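    // pair up the events two at a time (smallest values first) into the
    // last-level nodes; each such node stores its two events directly as
    // leaves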
    while (eventQueue.size() > 1) {
      htree[firstEmptyFieldIndex].isOnLastLevel = true;
      htree[firstEmptyFieldIndex].leftLeaf = eventQueue.top();
      eventQueue.pop();
      htree[firstEmptyFieldIndex].rightLeaf = eventQueue.top();
      eventQueue.pop();
      htree[firstEmptyFieldIndex].probability =
          (htree[firstEmptyFieldIndex].leftLeaf->getValue() +
           htree[firstEmptyFieldIndex].rightLeaf->getValue()) /
          sum_of_values;
      queue.push(&(htree[firstEmptyFieldIndex]));
      firstEmptyFieldIndex++;
    }
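    // with an odd number of events one event is left over; it gets a node of
    // its own, with both leaf pointers referring to the same event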
    if (!eventQueue.empty()) {
      htree[firstEmptyFieldIndex].isOnLastLevel = true;
      htree[firstEmptyFieldIndex].rightLeaf = eventQueue.top();
      htree[firstEmptyFieldIndex].leftLeaf = eventQueue.top();
      htree[firstEmptyFieldIndex].probability =
          htree[firstEmptyFieldIndex].leftLeaf->getValue() / sum_of_values;
      queue.push(&(htree[firstEmptyFieldIndex]));
      firstEmptyFieldIndex++;
    }

    // now connect the nodes, creating a new parent node for every connection:
    // always take the two nodes with the smallest probability and combine
    // them; repeat until just one node (the root) is left.
    huffmanNode<T> *h1;
    huffmanNode<T> *h2;
    while (queue.size() > 1) {
      h1 = queue.top();
      queue.pop();
      h2 = queue.top();
      queue.pop();
      htree[firstEmptyFieldIndex].probability =
          h1->probability + h2->probability;
      htree[firstEmptyFieldIndex].leftChild = h1;
      htree[firstEmptyFieldIndex].rightChild = h2;
      queue.push(&(htree[firstEmptyFieldIndex]));
      firstEmptyFieldIndex++;
    }
    // reorganize the probabilities: in every node, add the probability of the
    // right subtree to all nodes of the left subtree, then move the
    // right-subtree probabilities one level up, so that the tree can be
    // traversed with a single comparison per level.
    addProbabilityFromRightSubtreeToLeftSubtree(&htree[htree.size() - 1], 0);
    moveProbabilitiesFromRightSubtreesOneLevelUp(&htree[htree.size() - 1]);
    treeIsMade = true;
  }

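  // Given a random number p, uniform in [0, 1], returns a pointer to one of
  // the events, chosen with probability proportional to its getValue().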
  T *findHoppingDestination(double p) const {
    if (!treeIsMade) {
      throw std::runtime_error(
          "Tried to find Hopping Destination without initializing the "
          "Huffmantree first!");
    }
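    // start at the root, which is the last node written to htree, and walk
    // down using the precomputed probabilities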
    const huffmanNode<T> *node = &htree.back();
    while (!node->isOnLastLevel) {
      if (p > node->probability) {
        node = node->leftChild;
      } else {
        node = node->rightChild;
      }
    }
    return (p > node->probability ? node->leftLeaf : node->rightLeaf);
  }

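  // The tree only stores a pointer to the event vector; the vector must stay
  // alive, and makeTree() must be called before findHoppingDestination().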
  void setEvents(std::vector<T> *v) { this->events = v; }

 private:
  template <class S>
  struct huffmanNode {
    // leftChild/rightChild are used by the inner nodes, leftLeaf/rightLeaf by
    // the nodes on the last level before the leaves (the S objects themselves
    // represent the "leaf" level)
    huffmanNode *leftChild = nullptr;
    huffmanNode *rightChild = nullptr;
    S *rightLeaf = nullptr;
    S *leftLeaf = nullptr;
    double probability = 0.0;
    bool isOnLastLevel = false;
  };

  void addProbabilityFromRightSubtreeToLeftSubtree(huffmanNode<T> *n,
                                                   double add) {
    // for each node, adds the probability of the right child node to the left
    // child node and every node under it. If the tree looked like this before
    // calling this function (with the numbers representing the probability of
    // every node)

    //           1.0
    //       ____||____
    //      |          |
    //     0.4        0.6
    //     _||_      _||_
    //    |    |    |    |
    //  0.25 0.15  0.35 0.25
    //        _||_
    //       |    |
    //      0.1  0.05
    // then it would look like this after calling it
    //           1.0
    //       ____||____
    //      |          |
    //     1.0        0.6
    //     _||_      _||_
    //    |    |    |    |
    //   1.0 0.75  0.6  0.25
    //        _||_
    //       |    |
    //      0.75 0.65
    // now the tree could be traversed with "while (!n.isLeaf())
    // n = p > n.right.p ? n.left : n.right"; the function
    // moveProbabilitiesFromRightSubtreesOneLevelUp then moves these numbers
    // one level up, so that n.p can be used instead of n.right.p

    // adds "add" to the probability, then calls itself recursively.
    // this calculates the probabilities needed to traverse the tree quickly
    n->probability += add;
    // stop the recursion on the last level before the leaves
    if (n->isOnLastLevel) {
      return;
    }

    addProbabilityFromRightSubtreeToLeftSubtree(
        n->leftChild, add + n->rightChild->probability);
    addProbabilityFromRightSubtreeToLeftSubtree(n->rightChild, add);
  }

  void moveProbabilitiesFromRightSubtreesOneLevelUp(huffmanNode<T> *n) {
    // moves the probabilities on the right subtrees one level up.
    // If the tree looked like this before calling this function (with the
    // numbers representing the probability of every node)
    //           1.0
    //       ____||____
    //      |          |
    //     1.0        0.6
    //     _||_      _||_
    //    |    |    |    |
    //   1.0 0.75  0.6  0.25
    //        _||_
    //       |    |
    //      0.75 0.65
    // then it would look like this after calling it
    //           0.6
    //       ____||____
    //      |          |
    //     0.75      0.25
    //     _||_      _||_
    //    |    |    |    |
    //   1.0 0.65  0.6  0.25
    //        _||_
    //       |    |
    //     0.75  0.65
    // note that the probabilities on the leaf level are no longer needed to
    // traverse the tree; the traversal now is "while (!n.isLeaf())
    // n = p > n.p ? n.left : n.right"
    if (n->isOnLastLevel) {
      n->probability -= n->leftLeaf->getValue() / sum_of_values;
    } else {
      n->probability = n->rightChild->probability;
      moveProbabilitiesFromRightSubtreesOneLevelUp(n->rightChild);
      moveProbabilitiesFromRightSubtreesOneLevelUp(n->leftChild);
    }
  }

  // flat storage for all nodes; the root is the last element
  std::vector<huffmanNode<T>> htree;
  // set to true once makeTree() has run
  bool treeIsMade = false;
  // sum of getValue() over all events, used for normalization
  double sum_of_values = 0.0;
  // the events the tree is built from (not owned)
  std::vector<T> *events = nullptr;
};

}  // namespace xtp
}  // namespace votca
#endif  // HUFFMANTREE_H