//===- StringHash.h -------------------------------------------------------===//
//
//                     The MCLinker Project
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
#ifndef MCLD_ADT_STRINGHASH_H_
#define MCLD_ADT_STRINGHASH_H_

#include <llvm/ADT/StringRef.h>
#include <llvm/Support/DataTypes.h>

#include <cassert>
#include <cctype>
#include <functional>

namespace mcld {
namespace hash {

enum Type { RS, JS, PJW, ELF, BKDR, SDBM, DJB, DEK, BP, FNV, AP, ES };

/** \class template<uint32_t TYPE> StringHash
 *  \brief the template StringHash class, for specification
 */
template <uint32_t TYPE>
struct StringHash
    : public std::unary_function<const llvm::StringRef, uint32_t> {
  uint32_t operator()(const llvm::StringRef pKey) const {
    assert(false && "Undefined StringHash function.\n");
    return 0;
  }
};

/** \class StringHash<RSHash>
 *  \brief RS StringHash funciton
 */
template <>
struct StringHash<RS>
    : public std::unary_function<const llvm::StringRef, uint32_t> {
  uint32_t operator()(const llvm::StringRef pKey) const {
    const unsigned int b = 378551;
    uint32_t a = 63689;
    uint32_t hash_val = 0;

    for (unsigned int i = 0; i < pKey.size(); ++i) {
      hash_val = hash_val * a + pKey[i];
      a = a * b;
    }
    return hash_val;
  }
};

/** \class StringHash<JSHash>
 *  \brief JS hash funciton
 */
template <>
struct StringHash<JS>
    : public std::unary_function<const llvm::StringRef, uint32_t> {
  uint32_t operator()(const llvm::StringRef pKey) const {
    uint32_t hash_val = 1315423911;

    for (unsigned int i = 0; i < pKey.size(); ++i) {
      hash_val ^= ((hash_val << 5) + pKey[i] + (hash_val >> 2));
    }
    return hash_val;
  }
};

/** \class StringHash<PJW>
 *  \brief P.J. Weinberger hash function
 */
template <>
struct StringHash<PJW>
    : public std::unary_function<const llvm::StringRef, uint32_t> {
  uint32_t operator()(const llvm::StringRef pKey) const {
    const unsigned int BitsInUnsignedInt =
        (unsigned int)(sizeof(unsigned int) * 8);
    const unsigned int ThreeQuarters =
        (unsigned int)((BitsInUnsignedInt * 3) / 4);
    const unsigned int OneEighth = (unsigned int)(BitsInUnsignedInt / 8);
    const unsigned int HighBits = (unsigned int)(0xFFFFFFFF)
                                  << (BitsInUnsignedInt - OneEighth);
    uint32_t hash_val = 0;
    uint32_t test = 0;

    for (unsigned int i = 0; i < pKey.size(); ++i) {
      hash_val = (hash_val << OneEighth) + pKey[i];

      if ((test = hash_val & HighBits) != 0) {
        hash_val = ((hash_val ^ (test >> ThreeQuarters)) & (~HighBits));
      }
    }
    return hash_val;
  }
};

/** \class StringHash<ELF>
 *  \brief ELF hash function.
 */
template <>
struct StringHash<ELF>
    : public std::unary_function<const llvm::StringRef, uint32_t> {
  uint32_t operator()(const llvm::StringRef pKey) const {
    uint32_t hash_val = 0;
    uint32_t x = 0;

    for (unsigned int i = 0; i < pKey.size(); ++i) {
      hash_val = (hash_val << 4) + pKey[i];
      if ((x = hash_val & 0xF0000000L) != 0)
        hash_val ^= (x >> 24);
      hash_val &= ~x;
    }
    return hash_val;
  }
};

/** \class StringHash<BKDR>
 *  \brief BKDR hash function
 */
template <>
struct StringHash<BKDR>
    : public std::unary_function<const llvm::StringRef, uint32_t> {
  uint32_t operator()(const llvm::StringRef pKey) const {
    const uint32_t seed = 131;
    uint32_t hash_val = 0;

    for (uint32_t i = 0; i < pKey.size(); ++i)
      hash_val = (hash_val * seed) + pKey[i];
    return hash_val;
  }
};

/** \class StringHash<SDBM>
 *  \brief SDBM hash function
 *  0.049s in 100000 test
 */
template <>
struct StringHash<SDBM>
    : public std::unary_function<const llvm::StringRef, uint32_t> {
  uint32_t operator()(const llvm::StringRef pKey) const {
    uint32_t hash_val = 0;

    for (uint32_t i = 0; i < pKey.size(); ++i)
      hash_val = pKey[i] + (hash_val << 6) + (hash_val << 16) - hash_val;
    return hash_val;
  }
};

/** \class StringHash<DJB>
 *  \brief DJB hash function
 *  0.057s in 100000 test
 */
template <>
struct StringHash<DJB>
    : public std::unary_function<const llvm::StringRef, uint32_t> {
  uint32_t operator()(const llvm::StringRef pKey) const {
    uint32_t hash_val = 5381;

    for (uint32_t i = 0; i < pKey.size(); ++i)
      hash_val = ((hash_val << 5) + hash_val) + pKey[i];

    return hash_val;
  }
};

/** \class StringHash<DEK>
 *  \brief DEK hash function
 *  0.60s
 */
template <>
struct StringHash<DEK>
    : public std::unary_function<const llvm::StringRef, uint32_t> {
  uint32_t operator()(const llvm::StringRef pKey) const {
    uint32_t hash_val = pKey.size();

    for (uint32_t i = 0; i < pKey.size(); ++i)
      hash_val = ((hash_val << 5) ^ (hash_val >> 27)) ^ pKey[i];

    return hash_val;
  }
};

/** \class StringHash<BP>
 *  \brief BP hash function
 *  0.057s
 */
template <>
struct StringHash<BP>
    : public std::unary_function<const llvm::StringRef, uint32_t> {
  uint32_t operator()(const llvm::StringRef pKey) const {
    uint32_t hash_val = 0;
    for (uint32_t i = 0; i < pKey.size(); ++i)
      hash_val = hash_val << 7 ^ pKey[i];

    return hash_val;
  }
};

/** \class StringHash<FNV>
 *  \brief FNV hash function
 *  0.058s
 */
template <>
struct StringHash<FNV>
    : public std::unary_function<const llvm::StringRef, uint32_t> {
  uint32_t operator()(const llvm::StringRef pKey) const {
    const uint32_t fnv_prime = 0x811C9DC5;
    uint32_t hash_val = 0;
    for (uint32_t i = 0; i < pKey.size(); ++i) {
      hash_val *= fnv_prime;
      hash_val ^= pKey[i];
    }

    return hash_val;
  }
};

/** \class StringHash<AP>
 *  \brief AP hash function
 *  0.060s
 */
template <>
struct StringHash<AP>
    : public std::unary_function<const llvm::StringRef, uint32_t> {
  uint32_t operator()(const llvm::StringRef pKey) const {
    unsigned int hash_val = 0xAAAAAAAA;

    for (uint32_t i = 0; i < pKey.size(); ++i) {
      hash_val ^= ((i & 1) == 0)
                      ? ((hash_val << 7) ^ pKey[i] * (hash_val >> 3))
                      : (~((hash_val << 11) + (pKey[i] ^ (hash_val >> 5))));
    }

    return hash_val;
  }
};

/** \class StringHash<ES>
 *  \brief This is a revision of Edward Sayers' string characteristic function.
 *
 *  31-28  27  26  25   -   0
 *  +----+---+---+------------+
 *  | .  | N | - | a/A  ~ z/Z |
 *  +----+---+---+------------+
 *
 *  . (bit 31~28) - The number of '.' characters
 *  N (bit 27)    - Are there any numbers in the string
 *  - (bit 26)    - Does the string have '-' character
 *  bit 25~0      - Bit 25 is set only if the string contains a 'a' or 'A', and
 *                  Bit 24 is set only if ...                   'b' or 'B', ...
 */
template <>
struct StringHash<ES>
    : public std::unary_function<const llvm::StringRef, uint32_t> {
  uint32_t operator()(const llvm::StringRef pString) const {
    uint32_t result = 0x0;
    unsigned int dot = 0;
    std::string::size_type idx;
    for (idx = 0; idx < pString.size(); ++idx) {
      int cur_char = pString[idx];

      if ('.' == cur_char) {
        ++dot;
        continue;
      }

      if (isdigit(cur_char)) {
        result |= (1 << 27);
        continue;
      }

      if ('_' == cur_char) {
        result |= (1 << 26);
        continue;
      }

      if (isupper(cur_char)) {
        result |= (1 << (cur_char - 'A'));
        continue;
      }

      if (islower(cur_char)) {
        result |= (1 << (cur_char - 'a'));
        continue;
      }
    }
    result |= (dot << 28);
    return result;
  }

  /** \func may_include
   *  \brief is it possible that pRule is a sub-string of pInString
   */
  static bool may_include(uint32_t pRule, uint32_t pInString) {
    uint32_t in_c = pInString << 4;
    uint32_t r_c = pRule << 4;

    uint32_t res = (in_c ^ r_c) & r_c;
    if (0 != res)
      return false;

    uint32_t in_dot = pInString >> 28;
    uint32_t r_dot = pRule >> 28;
    if (r_dot > in_dot)
      return false;

    return true;
  }
};

/** \class template<uint32_t TYPE> StringCompare
 *  \brief the template StringCompare class, for specification
 */
template <typename STRING_TYPE>
struct StringCompare : public std::binary_function<const STRING_TYPE&,
                                                   const STRING_TYPE&,
                                                   bool> {
  bool operator()(const STRING_TYPE& X, const STRING_TYPE& Y) const {
    return X == Y;
  }
};

template <>
struct StringCompare<const char*>
    : public std::binary_function<const char*, const char*, bool> {
  bool operator()(const char* X, const char* Y) const {
    return (std::strcmp(X, Y) == 0);
  }
};

template <>
struct StringCompare<char*>
    : public std::binary_function<const char*, const char*, bool> {
  bool operator()(const char* X, const char* Y) const {
    return (std::strcmp(X, Y) == 0);
  }
};

}  // namespace hash
}  // namespace mcld

#endif  // MCLD_ADT_STRINGHASH_H_