hash_tmpbin.cpp
/*
 * Copyright (c) 2014-2015, Hewlett-Packard Development Company, LP.
 * This program is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License as published by the Free
 * Software Foundation; either version 2 of the License, or (at your option)
 * any later version.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details. You should have received a copy of the GNU General Public
 * License along with this program; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
 *
 * HP designates this particular file as subject to the "Classpath" exception
 * as provided by HP in the LICENSE.txt file that accompanied this code.
 */
#include "foedus/storage/hash/hash_tmpbin.hpp"

#include <glog/logging.h>

#include <ostream>
#include <string>

#include "foedus/assorted/assorted_func.hpp"

namespace foedus {
namespace storage {
namespace hash {

HashTmpBin::HashTmpBin()
  : memory_(), records_capacity_(0), records_consumed_(0), buckets_(nullptr), records_(nullptr) {
}

ErrorCode HashTmpBin::create_memory(uint16_t numa_node, uint64_t initial_size) {
  ASSERT_ND(initial_size > sizeof(RecordIndex) * kBucketCount);
  ASSERT_ND(sizeof(Record) == kPageSize);
  memory_.alloc(
    initial_size,
    1ULL << 21,
    memory::AlignedMemory::kNumaAllocOnnode,
    numa_node);
  on_memory_set();
  clean();
  return kErrorCodeOk;
}

void HashTmpBin::release_memory() {
  memory_.release_block();
  on_memory_set();
  clean();
}

void HashTmpBin::steal_memory(memory::AlignedMemory* provider) {
  ASSERT_ND(!provider->is_null());
  memory_ = std::move(*provider);
  ASSERT_ND(provider->is_null());
  ASSERT_ND(!memory_.is_null());
  on_memory_set();
  clean();
}

void HashTmpBin::give_memory(memory::AlignedMemory* recipient) {
  ASSERT_ND(!memory_.is_null());
  *recipient = std::move(memory_);
  ASSERT_ND(!recipient->is_null());
  ASSERT_ND(memory_.is_null());
  on_memory_set();
  clean();
}

void HashTmpBin::clean() {
  records_consumed_ = get_first_record();
  if (buckets_) {
    std::memset(buckets_, 0, records_consumed_ * sizeof(Record));
  }
}

void HashTmpBin::clean_quick() {
  ASSERT_ND(buckets_);
  ASSERT_ND(records_capacity_ > 0);
  ASSERT_ND(records_consumed_ >= get_first_record());
  // At some point, a plain mem-zero (clean()) becomes faster. We could switch like below,
  // but that case is rare, and it also makes unit-testing trickier.
  // if (records_consumed_ > get_first_record() + 256U) {
  //   clean();
  //   return;
  // }
  for (RecordIndex index = get_first_record(); index < records_consumed_; ++index) {
    Record* record = get_record(index);
    buckets_[extract_bucket(record->hash_)] = 0;
  }
  records_consumed_ = get_first_record();
}
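
// buckets_ and records_ are two views over the same memory block: the bucket array
// (kBucketCount RecordIndex entries) overlays the first few Record slots, so
// get_first_record() is the first index that actually holds a record. Because that
// index is never 0, a RecordIndex of 0 doubles as "no record" in buckets_ and next_.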
void HashTmpBin::on_memory_set() {
  if (memory_.is_null()) {
    buckets_ = nullptr;
    records_ = nullptr;
    records_capacity_ = 0;
  } else {
    buckets_ = reinterpret_cast<RecordIndex*>(memory_.get_block());
    records_ = reinterpret_cast<Record*>(memory_.get_block());
    records_capacity_ = memory_.get_size() / sizeof(Record);
    ASSERT_ND(sizeof(RecordIndex) * kBucketCount % sizeof(Record) == 0);
  }
}

inline ErrorCode HashTmpBin::alloc_record(RecordIndex* out) {
  if (UNLIKELY(records_consumed_ == records_capacity_)) {
    // Expand the memory while keeping its content, which is expensive! This mustn't happen often.
    LOG(INFO) << "We need to resize HashTmpBin! current_size=" << memory_.get_size();
    CHECK_ERROR_CODE(memory_.assure_capacity(memory_.get_size() * 2, 2.0, true));
    on_memory_set();
  }

  ASSERT_ND(records_consumed_ < records_capacity_);
  *out = records_consumed_;
  ++records_consumed_;
  return kErrorCodeOk;
}
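
// Inserts into the per-bucket singly-linked chain. search_bucket() either returns the
// existing record for this key (found_ != 0), or the chain's tail (tail_) so we can
// append the new record without re-scanning. If the key exists only as a logically
// deleted record, it is revived in place with the new XctId and payload.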
ErrorCode HashTmpBin::insert_record(
  xct::XctId xct_id,
  const void* key,
  uint16_t key_length,
  HashValue hash,
  const void* payload,
  uint16_t payload_length) {
  ASSERT_ND(!xct_id.is_deleted());
  ASSERT_ND(hashinate(key, key_length) == hash);
  SearchResult result = search_bucket(key, key_length, hash);
  if (result.found_ == 0) {
    RecordIndex new_index;
    CHECK_ERROR_CODE(alloc_record(&new_index));
    Record* record = get_record(new_index);
    record->set_all(xct_id, key, key_length, hash, payload, payload_length);

    if (result.tail_ == 0) {
      uint16_t bucket_index = extract_bucket(hash);
      ASSERT_ND(buckets_[bucket_index] == 0);
      buckets_[bucket_index] = new_index;
    } else {
      ASSERT_ND(buckets_[extract_bucket(hash)] != 0);
      Record* tail_record = get_record(result.tail_);
      tail_record->next_ = new_index;
    }
  } else {
    Record* record = get_record(result.found_);
    ASSERT_ND(record->hash_ == hash);
    if (UNLIKELY(!record->xct_id_.is_deleted())) {
      DLOG(WARNING) << "HashTmpBin::insert_record() hit KeyAlreadyExists case. This must not"
        << " happen except unit testcases.";
      return kErrorCodeStrKeyAlreadyExists;
    }
    ASSERT_ND(record->xct_id_.compare_epoch_and_orginal(xct_id) < 0);
    record->xct_id_ = xct_id;
    record->set_payload(payload, payload_length);
  }

  return kErrorCodeOk;
}

ErrorCode HashTmpBin::delete_record(
  xct::XctId xct_id,
  const void* key,
  uint16_t key_length,
  HashValue hash) {
  ASSERT_ND(xct_id.is_deleted());
  ASSERT_ND(hashinate(key, key_length) == hash);
  SearchResult result = search_bucket(key, key_length, hash);
  if (UNLIKELY(result.found_ == 0)) {
    DLOG(WARNING) << "HashTmpBin::delete_record() hit KeyNotFound case 1. This must not"
      << " happen except unit testcases.";
    return kErrorCodeStrKeyNotFound;
  } else {
    Record* record = get_record(result.found_);
    ASSERT_ND(record->hash_ == hash);
    if (UNLIKELY(record->xct_id_.is_deleted())) {
      DLOG(WARNING) << "HashTmpBin::delete_record() hit KeyNotFound case 2. This must not"
        << " happen except unit testcases.";
      return kErrorCodeStrKeyNotFound;
    }
    ASSERT_ND(record->xct_id_.compare_epoch_and_orginal(xct_id) < 0);
    record->xct_id_ = xct_id;
  }

  return kErrorCodeOk;
}

ErrorCode HashTmpBin::overwrite_record(
  xct::XctId xct_id,
  const void* key,
  uint16_t key_length,
  HashValue hash,
  const void* payload,
  uint16_t payload_offset,
  uint16_t payload_count) {
  ASSERT_ND(!xct_id.is_deleted());
  ASSERT_ND(hashinate(key, key_length) == hash);
  SearchResult result = search_bucket(key, key_length, hash);
  if (UNLIKELY(result.found_ == 0)) {
    DLOG(WARNING) << "HashTmpBin::overwrite_record() hit KeyNotFound case 1. This must not"
      << " happen except unit testcases.";
    return kErrorCodeStrKeyNotFound;
  } else {
    Record* record = get_record(result.found_);
    ASSERT_ND(record->hash_ == hash);
    if (UNLIKELY(record->xct_id_.is_deleted())) {
      DLOG(WARNING) << "HashTmpBin::overwrite_record() hit KeyNotFound case 2. This must not"
        << " happen except unit testcases.";
      return kErrorCodeStrKeyNotFound;
    } else if (UNLIKELY(record->payload_length_ < payload_offset + payload_count)) {
      DLOG(WARNING) << "HashTmpBin::overwrite_record() hit TooShortPayload case. This must not"
        << " happen except unit testcases.";
      return kErrorCodeStrTooShortPayload;
    }
    ASSERT_ND(record->xct_id_.compare_epoch_and_orginal(xct_id) < 0);
    record->xct_id_ = xct_id;
    record->overwrite_payload(payload, payload_offset, payload_count);
  }

  return kErrorCodeOk;
}

ErrorCode HashTmpBin::update_record(
  xct::XctId xct_id,
  const void* key,
  uint16_t key_length,
  HashValue hash,
  const void* payload,
  uint16_t payload_length) {
  ASSERT_ND(!xct_id.is_deleted());
  ASSERT_ND(hashinate(key, key_length) == hash);
  SearchResult result = search_bucket(key, key_length, hash);
  if (UNLIKELY(result.found_ == 0)) {
    DLOG(WARNING) << "HashTmpBin::update_record() hit KeyNotFound case 1. This must not"
      << " happen except unit testcases.";
    return kErrorCodeStrKeyNotFound;
  } else {
    Record* record = get_record(result.found_);
    ASSERT_ND(record->hash_ == hash);
    if (UNLIKELY(record->xct_id_.is_deleted())) {
      DLOG(WARNING) << "HashTmpBin::update_record() hit KeyNotFound case 2. This must not"
        << " happen except unit testcases.";
      return kErrorCodeStrKeyNotFound;
    }
    ASSERT_ND(record->xct_id_.compare_epoch_and_orginal(xct_id) < 0);
    record->xct_id_ = xct_id;
    record->set_payload(payload, payload_length);
  }

  return kErrorCodeOk;
}
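
// Walks the chain of the bucket for this hash. On a hit, returns the record's index in
// found_ (tail_ is 0). On a miss, found_ is 0 and tail_ is the last record of the chain
// (or 0 if the bucket is empty), which insert_record() uses as the append point.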
inline HashTmpBin::SearchResult HashTmpBin::search_bucket(
  const void* key,
  uint16_t key_length,
  HashValue hash) const {
  uint16_t bucket_index = extract_bucket(hash);
  RecordIndex head = buckets_[bucket_index];
  if (head == 0) {
    return SearchResult(0, 0);
  }

  ASSERT_ND(head > 0);
  RecordIndex last_seen = 0;
  for (RecordIndex cur = head; cur != 0;) {
    Record* record = get_record(cur);
    if (record->hash_ == hash && record->key_length_ == key_length) {
      if (LIKELY(std::memcmp(record->get_key(), key, key_length) == 0)) {
        return SearchResult(cur, 0);
      }
    }

    last_seen = cur;
    cur = record->next_;
  }

  return SearchResult(0, last_seen);
}

std::ostream& operator<<(std::ostream& o, const HashTmpBin& v) {
  // Each bin shouldn't have that many records... so, output everything!
  o << "<HashTmpBin>" << std::endl;
  o << "  " << v.memory_ << std::endl;
  o << "  <records_capacity_>" << v.records_capacity_ << "</records_capacity_>" << std::endl;
  o << "  <records_consumed_>" << v.records_consumed_ << "</records_consumed_>" << std::endl;
  o << "  <buckets_>" << std::endl;
  for (uint32_t i = 0; i < HashTmpBin::kBucketCount; ++i) {
    if (v.buckets_[i] != 0) {
      o << "    <bucket idx=\"" << i << "\" head_rec=\"" << v.buckets_[i] << "\" />" << std::endl;
    }
  }
  o << "  </buckets_>" << std::endl;
  o << "  <records_>" << std::endl;
  uint32_t begin = v.get_first_record();
  for (uint32_t i = begin; i < v.get_records_consumed(); ++i) {
    HashTmpBin::Record* record = v.get_record(i);
    o << "    <record id=\"" << i << "\" hash=\"" << assorted::Hex(record->hash_, 16) << "\"";
    if (record->next_) {
      o << " next_rec=\"" << record->next_ << "\"";
    }
    o << ">";
    o << "<key>" << assorted::HexString(std::string(record->get_key(), record->key_length_))
      << "</key>";
    o << "<payload>"
      << assorted::HexString(std::string(record->get_payload(), record->payload_length_))
      << "</payload>";
    o << record->xct_id_;
    o << "</record>" << std::endl;
  }
  o << "  </records_>" << std::endl;
  o << "</HashTmpBin>";
  return o;
}

}  // namespace hash
}  // namespace storage
}  // namespace foedus
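
For orientation, here is a minimal sketch of how a composer-side caller might drive this class. It is not part of the file: compose_example() is a hypothetical helper, the xct::XctId is assumed to be prepared (non-deleted) by the caller, and the accessors it uses (create_memory() with its default initial size, get_first_record(), get_records_consumed(), get_record()) are assumed to be publicly accessible as they are used by operator<< above.

#include "foedus/storage/hash/hash_tmpbin.hpp"

namespace foedus {
namespace storage {
namespace hash {

// Hypothetical helper: composes one record into a bin, iterates the bin, then recycles it.
ErrorCode compose_example(xct::XctId xct_id, uint16_t numa_node) {
  HashTmpBin bin;
  CHECK_ERROR_CODE(bin.create_memory(numa_node));  // default initial size

  const char key[] = "example-key";
  const char payload[] = "example-payload";
  HashValue hash = hashinate(key, sizeof(key));
  CHECK_ERROR_CODE(bin.insert_record(xct_id, key, sizeof(key), hash, payload, sizeof(payload)));

  // Valid records occupy [get_first_record(), get_records_consumed()).
  for (HashTmpBin::RecordIndex i = bin.get_first_record(); i < bin.get_records_consumed(); ++i) {
    HashTmpBin::Record* record = bin.get_record(i);
    (void)record;  // ... copy the tuple out to the destination page ...
  }

  bin.clean_quick();     // reset for the next bin, reusing the same memory
  bin.release_memory();  // or give_memory() to pass the block to another HashTmpBin
  return kErrorCodeOk;
}

}  // namespace hash
}  // namespace storage
}  // namespace foedus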