0cf4b600e9
Change-Id: Ia2b137231437f6c3c0f4af49fba1a7bdc320ed4a
301 lines
8.6 KiB
C++
301 lines
8.6 KiB
C++
/* -*- Mode:C++; c-file-style:"gnu"; indent-tabs-mode:nil; -*- */
|
|
/*
|
|
* Copyright (c) 2014-2019, The University of Memphis
|
|
*
|
|
* This file is part of PSync.
|
|
* See AUTHORS.md for complete list of PSync authors and contributors.
|
|
*
|
|
* PSync is free software: you can redistribute it and/or modify it under the terms
|
|
* of the GNU Lesser General Public License as published by the Free Software Foundation,
|
|
* either version 3 of the License, or (at your option) any later version.
|
|
*
|
|
* PSync is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY;
|
|
* without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR
|
|
* PURPOSE. See the GNU Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public License along with
|
|
* PSync, e.g., in COPYING.md file. If not, see <http://www.gnu.org/licenses/>.
|
|
*
|
|
|
|
* This file incorporates work covered by the following copyright and
|
|
* permission notice:
|
|
|
|
* The MIT License (MIT)
|
|
|
|
* Copyright (c) 2014 Gavin Andresen
|
|
|
|
* Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
* of this software and associated documentation files (the "Software"), to deal
|
|
* in the Software without restriction, including without limitation the rights
|
|
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
* copies of the Software, and to permit persons to whom the Software is
|
|
* furnished to do so, subject to the following conditions:
|
|
|
|
* The above copyright notice and this permission notice shall be included in all
|
|
* copies or substantial portions of the Software.
|
|
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
* SOFTWARE.
|
|
*/
|
|
|
|
#include "PSync/detail/iblt.hpp"
|
|
#include "PSync/detail/util.hpp"
|
|
|
|
#include <boost/iostreams/device/array.hpp>
|
|
#include <boost/iostreams/filtering_stream.hpp>
|
|
#include <boost/iostreams/filter/zlib.hpp>
|
|
#include <boost/iostreams/copy.hpp>
|
|
|
|
namespace psync {
|
|
|
|
namespace bio = boost::iostreams;
|
|
|
|
const size_t N_HASH(3);
|
|
const size_t N_HASHCHECK(11);
|
|
|
|
bool
|
|
HashTableEntry::isPure() const
|
|
{
|
|
if (count == 1 || count == -1) {
|
|
uint32_t check = murmurHash3(N_HASHCHECK, keySum);
|
|
return keyCheck == check;
|
|
}
|
|
|
|
return false;
|
|
}
|
|
|
|
bool
|
|
HashTableEntry::isEmpty() const
|
|
{
|
|
return count == 0 && keySum == 0 && keyCheck == 0;
|
|
}
|
|
|
|
IBLT::IBLT(size_t expectedNumEntries)
|
|
{
|
|
// 1.5x expectedNumEntries gives very low probability of decoding failure
|
|
size_t nEntries = expectedNumEntries + expectedNumEntries / 2;
|
|
// make nEntries exactly divisible by N_HASH
|
|
size_t remainder = nEntries % N_HASH;
|
|
if (remainder != 0) {
|
|
nEntries += (N_HASH - remainder);
|
|
}
|
|
|
|
m_hashTable.resize(nEntries);
|
|
}
|
|
|
|
void
|
|
IBLT::initialize(const ndn::name::Component& ibltName)
|
|
{
|
|
const auto& values = extractValueFromName(ibltName);
|
|
|
|
if (3 * m_hashTable.size() != values.size()) {
|
|
BOOST_THROW_EXCEPTION(Error("Received IBF cannot be decoded!"));
|
|
}
|
|
|
|
for (size_t i = 0; i < m_hashTable.size(); i++) {
|
|
HashTableEntry& entry = m_hashTable.at(i);
|
|
if (values[i * 3] != 0) {
|
|
entry.count = values[i * 3];
|
|
entry.keySum = values[(i * 3) + 1];
|
|
entry.keyCheck = values[(i * 3) + 2];
|
|
}
|
|
}
|
|
}
|
|
|
|
void
|
|
IBLT::update(int plusOrMinus, uint32_t key)
|
|
{
|
|
size_t bucketsPerHash = m_hashTable.size() / N_HASH;
|
|
|
|
for (size_t i = 0; i < N_HASH; i++) {
|
|
size_t startEntry = i * bucketsPerHash;
|
|
uint32_t h = murmurHash3(i, key);
|
|
HashTableEntry& entry = m_hashTable.at(startEntry + (h % bucketsPerHash));
|
|
entry.count += plusOrMinus;
|
|
entry.keySum ^= key;
|
|
entry.keyCheck ^= murmurHash3(N_HASHCHECK, key);
|
|
}
|
|
}
|
|
|
|
void
|
|
IBLT::insert(uint32_t key)
|
|
{
|
|
update(INSERT, key);
|
|
}
|
|
|
|
void
|
|
IBLT::erase(uint32_t key)
|
|
{
|
|
update(ERASE, key);
|
|
}
|
|
|
|
bool
|
|
IBLT::listEntries(std::set<uint32_t>& positive, std::set<uint32_t>& negative) const
|
|
{
|
|
IBLT peeled = *this;
|
|
|
|
size_t nErased = 0;
|
|
do {
|
|
nErased = 0;
|
|
for (const auto& entry : peeled.m_hashTable) {
|
|
if (entry.isPure()) {
|
|
if (entry.count == 1) {
|
|
positive.insert(entry.keySum);
|
|
}
|
|
else {
|
|
negative.insert(entry.keySum);
|
|
}
|
|
peeled.update(-entry.count, entry.keySum);
|
|
++nErased;
|
|
}
|
|
}
|
|
} while (nErased > 0);
|
|
|
|
// If any buckets for one of the hash functions is not empty,
|
|
// then we didn't peel them all:
|
|
for (const auto& entry : peeled.m_hashTable) {
|
|
if (entry.isEmpty() != true) {
|
|
return false;
|
|
}
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
IBLT
|
|
IBLT::operator-(const IBLT& other) const
|
|
{
|
|
BOOST_ASSERT(m_hashTable.size() == other.m_hashTable.size());
|
|
|
|
IBLT result(*this);
|
|
for (size_t i = 0; i < m_hashTable.size(); i++) {
|
|
HashTableEntry& e1 = result.m_hashTable.at(i);
|
|
const HashTableEntry& e2 = other.m_hashTable.at(i);
|
|
e1.count -= e2.count;
|
|
e1.keySum ^= e2.keySum;
|
|
e1.keyCheck ^= e2.keyCheck;
|
|
}
|
|
|
|
return result;
|
|
}
|
|
|
|
bool
|
|
operator==(const IBLT& iblt1, const IBLT& iblt2)
|
|
{
|
|
auto iblt1HashTable = iblt1.getHashTable();
|
|
auto iblt2HashTable = iblt2.getHashTable();
|
|
if (iblt1HashTable.size() != iblt2HashTable.size()) {
|
|
return false;
|
|
}
|
|
|
|
size_t N = iblt1HashTable.size();
|
|
|
|
for (size_t i = 0; i < N; i++) {
|
|
if (iblt1HashTable[i].count != iblt2HashTable[i].count ||
|
|
iblt1HashTable[i].keySum != iblt2HashTable[i].keySum ||
|
|
iblt1HashTable[i].keyCheck != iblt2HashTable[i].keyCheck)
|
|
return false;
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
bool
|
|
operator!=(const IBLT& iblt1, const IBLT& iblt2)
|
|
{
|
|
return !(iblt1 == iblt2);
|
|
}
|
|
|
|
std::ostream&
|
|
operator<<(std::ostream& out, const IBLT& iblt)
|
|
{
|
|
out << "count keySum keyCheckMatch\n";
|
|
for (const auto& entry : iblt.getHashTable()) {
|
|
out << entry.count << " " << entry.keySum << " ";
|
|
out << ((murmurHash3(N_HASHCHECK, entry.keySum) == entry.keyCheck) ||
|
|
(entry.isEmpty())? "true" : "false");
|
|
out << "\n";
|
|
}
|
|
|
|
return out;
|
|
}
|
|
|
|
void
|
|
IBLT::appendToName(ndn::Name& name) const
|
|
{
|
|
size_t n = m_hashTable.size();
|
|
size_t unitSize = (32 * 3) / 8; // hard coding
|
|
size_t tableSize = unitSize * n;
|
|
|
|
std::vector<char> table(tableSize);
|
|
|
|
for (size_t i = 0; i < n; i++) {
|
|
// table[i*12], table[i*12+1], table[i*12+2], table[i*12+3] --> hashTable[i].count
|
|
|
|
table[(i * unitSize)] = 0xFF & m_hashTable[i].count;
|
|
table[(i * unitSize) + 1] = 0xFF & (m_hashTable[i].count >> 8);
|
|
table[(i * unitSize) + 2] = 0xFF & (m_hashTable[i].count >> 16);
|
|
table[(i * unitSize) + 3] = 0xFF & (m_hashTable[i].count >> 24);
|
|
|
|
// table[i*12+4], table[i*12+5], table[i*12+6], table[i*12+7] --> hashTable[i].keySum
|
|
|
|
table[(i * unitSize) + 4] = 0xFF & m_hashTable[i].keySum;
|
|
table[(i * unitSize) + 5] = 0xFF & (m_hashTable[i].keySum >> 8);
|
|
table[(i * unitSize) + 6] = 0xFF & (m_hashTable[i].keySum >> 16);
|
|
table[(i * unitSize) + 7] = 0xFF & (m_hashTable[i].keySum >> 24);
|
|
|
|
// table[i*12+8], table[i*12+9], table[i*12+10], table[i*12+11] --> hashTable[i].keyCheck
|
|
|
|
table[(i * unitSize) + 8] = 0xFF & m_hashTable[i].keyCheck;
|
|
table[(i * unitSize) + 9] = 0xFF & (m_hashTable[i].keyCheck >> 8);
|
|
table[(i * unitSize) + 10] = 0xFF & (m_hashTable[i].keyCheck >> 16);
|
|
table[(i * unitSize) + 11] = 0xFF & (m_hashTable[i].keyCheck >> 24);
|
|
}
|
|
|
|
bio::filtering_streambuf<bio::input> in;
|
|
in.push(bio::zlib_compressor());
|
|
in.push(bio::array_source(table.data(), table.size()));
|
|
|
|
std::stringstream sstream;
|
|
bio::copy(in, sstream);
|
|
|
|
std::string compressedIBF = sstream.str();
|
|
name.append(compressedIBF.begin(), compressedIBF.end());
|
|
}
|
|
|
|
std::vector<uint32_t>
|
|
IBLT::extractValueFromName(const ndn::name::Component& ibltName) const
|
|
{
|
|
std::string compressed(ibltName.value_begin(), ibltName.value_end());
|
|
|
|
bio::filtering_streambuf<bio::input> in;
|
|
in.push(bio::zlib_decompressor());
|
|
in.push(bio::array_source(compressed.data(), compressed.size()));
|
|
|
|
std::stringstream sstream;
|
|
bio::copy(in, sstream);
|
|
std::string ibltStr = sstream.str();
|
|
|
|
std::vector<uint8_t> ibltValues(ibltStr.begin(), ibltStr.end());
|
|
size_t n = ibltValues.size() / 4;
|
|
|
|
std::vector<uint32_t> values(n, 0);
|
|
|
|
for (size_t i = 0; i < 4 * n; i += 4) {
|
|
uint32_t t = (ibltValues[i + 3] << 24) +
|
|
(ibltValues[i + 2] << 16) +
|
|
(ibltValues[i + 1] << 8) +
|
|
ibltValues[i];
|
|
values[i / 4] = t;
|
|
}
|
|
|
|
return values;
|
|
}
|
|
|
|
} // namespace psync
|