// Fragment of SharedMemoryRepo::get_self_path(uint64_t upid, Eid eid) — the
// signature line is missing from this extract; surviving lines are kept
// verbatim (including the stray original-file line numbers left by the
// extraction tool).
// Builds the shared-memory meta-file path for THIS process/engine pair:
//   "/tmp/libfoedus_shm_<upid>_<eid>"
// upid is the process ID and eid the engine ID, per the declared signature.
38 std::string pid_str = std::to_string(upid);
39 std::string eid_str = std::to_string(eid);
40 return std::string(
"/tmp/libfoedus_shm_") + pid_str + std::string(
"_") + eid_str;
// Fragment of SharedMemoryRepo::get_master_path(uint64_t master_upid,
// Eid master_eid) — signature line missing from this extract; surviving lines
// kept verbatim. Same path format as get_self_path, but keyed by the MASTER
// process's pid/eid so a child SOC can locate the master's shared memories:
//   "/tmp/libfoedus_shm_<master_upid>_<master_eid>"
43 std::string pid_str = std::to_string(master_upid);
44 std::string eid_str = std::to_string(master_eid);
45 return std::string(
"/tmp/libfoedus_shm_") + pid_str + std::string(
"_") + eid_str;
65 uint64_t
align_4kb(uint64_t value) {
return assorted::align< uint64_t, (1U << 12) >(value); }
66 uint64_t
align_2mb(uint64_t value) {
return assorted::align< uint64_t, (1U << 21) >(value); }
// Fragment of SharedMemoryRepo::allocate_one_node — many interior lines of
// the original (69-71, 75, 77, 82, 84, 86-90) are missing from this extract;
// surviving lines kept verbatim. Per the declaration seen elsewhere, this is
// the per-NUMA-node allocation routine run by one thread per node from
// allocate_shared_memories.
68 void SharedMemoryRepo::allocate_one_node(
72 uint64_t node_memory_size,
73 bool rigorous_memory_boundary_check,
74 bool rigorous_page_boundary_check,
76 SharedMemoryRepo* repo) {
// Path for this node's shared memory: "<self_path>_node_<node>".
78 std::string node_memory_path
79 =
get_self_path(upid, eid) + std::string(
"_node_") + std::to_string(node);
// Hugepages are the default ...
80 bool use_hugepages =
true;
81 if (rigorous_memory_boundary_check || rigorous_page_boundary_check) {
// ... but disabled when either rigorous boundary check is on —
// presumably because mprotect-based boundary checking needs 4-KiB page
// granularity rather than 2-MiB hugepages. TODO(review): confirm.
83 use_hugepages =
false;
// Result of the allocation is reported back through *alloc_result.
85 *alloc_result = repo->node_memories_[node].alloc(
// On the (missing) error path, the partially-allocated block is released.
91 repo->node_memories_[node].release_block();
// Fragment of SharedMemoryRepo::allocate_shared_memories (master-side setup;
// see its declaration: "Master process creates shared memories by calling
// this method"). Interior lines are missing from this extract; surviving
// lines kept verbatim.
// Serialize the EngineOptions to XML; the XML text is stored at the start of
// the global memory so that attaching children can recover the options.
104 std::stringstream options_stream;
106 std::string xml(options_stream.str());
107 uint64_t xml_size = xml.size();
// Global shared memory lives at "<self_path>_global".
111 std::string global_memory_path =
get_self_path(upid, eid) + std::string(
"_global");
113 CHECK_ERROR(global_memory_.
alloc(global_memory_path, global_memory_size, 0, global_hugepages));
// reset_boundaries=true: master initializes the protected boundaries.
117 set_global_memory_anchors(xml_size, options,
true);
// Layout at the head of global memory: [uint64_t xml_size][xml bytes ...].
121 std::memcpy(global_memory_.
get_block(), &xml_size,
sizeof(xml_size));
122 std::memcpy(global_memory_.
get_block() +
sizeof(xml_size), xml.data(), xml_size);
// Node memories are allocated in parallel, one thread per SOC/NUMA node.
127 std::vector< std::thread > alloc_threads;
128 for (uint16_t node = 0; node < soc_count_; ++node) {
129 alloc_threads.emplace_back(std::thread(
130 SharedMemoryRepo::allocate_one_node,
137 alloc_results + node,
// Join all workers and collect per-node results; the loop keeps joining even
// after an error so no thread is leaked.
143 for (uint16_t node = 0; node < soc_count_; ++node) {
144 alloc_threads[node].join();
145 if (alloc_results[node].is_error()) {
146 std::cerr <<
"[FOEDUS] Failed to allocate node shared memory for node-" << node
147 <<
". " << alloc_results[node] << std::endl;
148 last_error = alloc_results[node];
// With all node memories in place, set up per-node anchors
// (reset_boundaries=true: master initializes them).
158 for (uint16_t node = 0; node < soc_count_; ++node) {
159 set_node_memory_anchors(node, options,
true);
// Fragment of SharedMemoryRepo::attach_shared_memories (child-side; see its
// declaration: children "set a reference to shared memory and receive the
// EngineOptions values"). Interior lines are missing from this extract;
// surviving lines kept verbatim.
166 uint64_t master_upid,
// 'base' is presumably get_master_path(master_upid, master_eid) — the line
// computing it is missing from this extract. TODO(review): confirm.
173 std::string global_memory_path = base + std::string(
"_global");
175 global_memory_.
attach(global_memory_path, global_hugepages);
176 if (global_memory_.
is_null()) {
// Recover the master's EngineOptions XML from the head of global memory:
// [uint64_t xml_size][xml bytes ...], mirroring the memcpy layout written by
// allocate_shared_memories.
182 uint64_t xml_size = 0;
183 std::memcpy(&xml_size, global_memory_.
get_block(),
sizeof(xml_size));
185 std::string xml(global_memory_.
get_block() +
sizeof(xml_size), xml_size);
188 my_soc_id_ = my_soc_id;
189 init_empty(*options);
// reset_boundaries=false: the attaching child must NOT reinitialize
// boundaries the master already set up.
190 set_global_memory_anchors(xml_size, *options,
false);
// Attach every node's shared memory ("<base>_node_<node>") and wire anchors.
193 for (uint16_t node = 0; node < soc_count_; ++node) {
194 std::string node_memory_str = base + std::string(
"_node_") + std::to_string(node);
196 if (node_memories_[node].is_null()) {
199 set_node_memory_anchors(node, *options,
false);
// Extra handling for this child's own node memory (lines missing).
204 if (!node_memories_[my_soc_id].is_null()) {
// Fragments of (apparently) SharedMemoryRepo::mark_for_release and
// SharedMemoryRepo::deallocate_shared_memories — so many interior lines are
// missing from this extract that the exact function boundary between the two
// cannot be determined here. Surviving lines kept verbatim.
// Mark each node memory (then the global memory) for OS-level reclamation
// once all processes detach.
217 for (uint16_t i = 0; i < soc_count_; ++i) {
218 if (node_memories_) {
226 if (!global_memory_.
is_null()) {
235 global_memory_anchors_.
clear();
// Per-node teardown: if mprotect was applied to this node's protected
// boundaries (protected_boundaries_needs_release_), it must be released
// before freeing.
240 for (uint16_t i = 0; i < soc_count_; ++i) {
241 if (node_memories_) {
242 if (node_memory_anchors_[i].protected_boundaries_needs_release_) {
// Finally free the heap-side arrays and null the pointers so a double call
// is harmless.
254 if (node_memories_) {
255 delete[] node_memories_;
256 node_memories_ =
nullptr;
258 if (node_memory_anchors_) {
259 delete[] node_memory_anchors_;
260 node_memory_anchors_ =
nullptr;
// Fragment of SharedMemoryRepo::init_empty — body lines 266-268 and the loop
// body are missing from this extract; surviving lines kept verbatim.
// Presumably sizes internal arrays from 'options' and iterates per SOC to
// default-initialize per-node state. TODO(review): confirm against full file.
265 void SharedMemoryRepo::init_empty(
const EngineOptions& options) {
269 for (uint16_t node = 0; node < soc_count_; ++node) {
// Fragment of SharedMemoryRepo::set_global_memory_anchors — interior lines
// are missing from this extract; surviving lines kept verbatim.
// Walks the global shared-memory block, carving it into fixed regions in a
// fixed order and recording each region's address in global_memory_anchors_.
// 'total' (declared on a missing line) is the running byte offset from
// 'base'; after each region a 4-KiB ProtectedBoundary sentinel is placed by
// put_global_memory_boundary (reset_boundaries tells it whether to
// (re)initialize the sentinel — true for the allocating master, false for
// attaching children).
274 void SharedMemoryRepo::set_global_memory_anchors(
276 const EngineOptions& options,
277 bool reset_boundaries) {
// Region 1: the serialized EngineOptions XML, preceded by its uint64_t size.
281 global_memory_anchors_.
options_xml_ = base +
sizeof(uint64_t);
282 total +=
align_4kb(
sizeof(uint64_t) + xml_size);
283 put_global_memory_boundary(&total,
"options_xml_boundary", reset_boundaries);
// Then one control block per manager, each followed by its boundary.
286 =
reinterpret_cast<MasterEngineStatus*
>(base + total);
288 put_global_memory_boundary(&total,
"master_status_memory_boundary", reset_boundaries);
291 =
reinterpret_cast<log::LogManagerControlBlock*
>(base + total);
293 put_global_memory_boundary(&total,
"log_manager_memory_boundary", reset_boundaries);
296 =
reinterpret_cast<log::MetaLogControlBlock*
>(base + total);
298 put_global_memory_boundary(&total,
"meta_logger_memory_boundary", reset_boundaries);
301 =
reinterpret_cast<restart::RestartManagerControlBlock*
>(base + total);
303 put_global_memory_boundary(&total,
"restart_manager_memory_boundary", reset_boundaries);
306 =
reinterpret_cast<savepoint::SavepointManagerControlBlock*
>(base + total);
308 put_global_memory_boundary(&total,
"savepoint_manager_memory_boundary", reset_boundaries);
311 =
reinterpret_cast<snapshot::SnapshotManagerControlBlock*
>(base + total);
313 put_global_memory_boundary(&total,
"snapshot_manager_memory_boundary", reset_boundaries);
316 =
reinterpret_cast<storage::StorageManagerControlBlock*
>(base + total);
318 put_global_memory_boundary(&total,
"storage_manager_memory_boundary", reset_boundaries);
321 =
reinterpret_cast<xct::XctManagerControlBlock*
>(base + total);
323 put_global_memory_boundary(&total,
"xct_manager_memory_boundary", reset_boundaries);
// Partitioner metadata array: one entry per storage, 4-KiB aligned.
326 =
reinterpret_cast<storage::PartitionerMetadata*
>(base + total);
327 total +=
align_4kb(
sizeof(storage::PartitionerMetadata) * options.storage_.max_storages_);
328 put_global_memory_boundary(&total,
"partitioner_metadata_boundary", reset_boundaries);
// Partitioner data block, sized in MB by options (<< 20 converts MB→bytes).
330 total +=
static_cast<uint64_t
>(options.storage_.partitioner_data_memory_mb_) << 20;
331 put_global_memory_boundary(&total,
"partitioner_data_boundary", reset_boundaries);
// Storage-name sort memory (IDs of storages sorted by name).
336 put_global_memory_boundary(&total,
"storage_name_sort_memory_boundary", reset_boundaries);
// Storage control blocks: one per storage.
339 =
reinterpret_cast<storage::StorageControlBlock*
>(base + total);
341 * options.storage_.max_storages_;
342 put_global_memory_boundary(&total,
"storage_memories_boundary", reset_boundaries);
// Shared user memory, sized in KB by options (1024ULL converts KB→bytes).
345 total +=
align_4kb(1024ULL * options.soc_.shared_user_memory_size_kb_);
346 put_global_memory_boundary(&total,
"user_memory_boundary", reset_boundaries);
// Sanity check: the final offset must equal the allocated size; mismatch
// means the layout here diverged from calculate_global_memory_size.
350 std::cerr <<
"[FOEDUS] global memory size doesn't match. bug?"
352 <<
", expected=" << total << std::endl;
// Optionally mprotect every boundary page to trap overruns at runtime.
355 if (options.memory_.rigorous_memory_boundary_check_) {
359 boundary->acquire_protect();
// Fragment of SharedMemoryRepo::calculate_global_memory_size — only one
// statement survives in this extract; kept verbatim. It accounts for the
// options-XML region ([uint64_t size][xml bytes], 4-KiB aligned) plus one
// kBoundarySize sentinel, mirroring the first region laid out by
// set_global_memory_anchors.
370 total +=
align_4kb(
sizeof(xml_size) + xml_size) + kBoundarySize;
// Fragment of SharedMemoryRepo::set_node_memory_anchors — interior lines are
// missing from this extract; surviving lines kept verbatim.
// Per-node analog of set_global_memory_anchors: carves node_memories_[node]
// into fixed regions (child status, volatile-pool status, proc manager/list,
// log reducer, loggers, then per-thread regions), placing a ProtectedBoundary
// sentinel after each via put_node_memory_boundary. reset_boundaries has the
// same master-vs-child meaning as in set_global_memory_anchors.
395 void SharedMemoryRepo::set_node_memory_anchors(
398 bool reset_boundaries) {
399 char* base = node_memories_[node].
get_block();
404 put_node_memory_boundary(node, &total,
"node_child_status_memory_boundary", reset_boundaries);
408 put_node_memory_boundary(node, &total,
"node_volatile_pool_status_boundary", reset_boundaries);
412 put_node_memory_boundary(node, &total,
"node_proc_manager_memory_boundary", reset_boundaries);
416 put_node_memory_boundary(node, &total,
"node_proc_memory_boundary", reset_boundaries);
420 put_node_memory_boundary(node, &total,
"node_proc_name_sort_memory_boundary", reset_boundaries);
424 put_node_memory_boundary(node, &total,
"node_log_reducer_memory_boundary", reset_boundaries);
428 put_node_memory_boundary(
431 "node_log_reducer_root_info_pages_boundary",
437 put_node_memory_boundary(node, &total,
"node_logger_memories_boundary", reset_boundaries);
// Per-thread regions: thread control block, task input/output buffers, and
// the MCS lock memories (WW, RW-simple, RW-extended, RW-async mappings).
// 'thread_anchor' presumably references thread_anchors_[...] — the declaring
// line is missing from this extract. TODO(review): confirm.
444 put_node_memory_boundary(node, &total,
"thread_memory_boundary", reset_boundaries);
446 thread_anchor.task_input_memory_ = base + total;
448 put_node_memory_boundary(node, &total,
"thread_task_input_memory_boundary", reset_boundaries);
450 thread_anchor.task_output_memory_ = base + total;
452 put_node_memory_boundary(node, &total,
"thread_task_output_memory_boundary", reset_boundaries);
454 thread_anchor.mcs_ww_lock_memories_ =
reinterpret_cast<xct::McsWwBlock*
>(base + total);
456 put_node_memory_boundary(node, &total,
"thread_mcs_lock_memories_boundary", reset_boundaries);
458 thread_anchor.mcs_rw_simple_lock_memories_
461 put_node_memory_boundary(
462 node, &total,
"thread_mcs_rw_simple_lock_memories_boundary", reset_boundaries);
463 thread_anchor.mcs_rw_extended_lock_memories_
466 put_node_memory_boundary(
467 node, &total,
"thread_mcs_rw_extended_lock_memories_boundary", reset_boundaries);
469 thread_anchor.mcs_rw_async_mappings_memories_
472 put_node_memory_boundary(
473 node, &total,
"thread_mcs_rw_async_mappings_memories_boundary", reset_boundaries);
// Bulk regions last: the log-reducer buffers and the (largest) volatile
// page pool.
477 uint64_t reducer_buffer_size
481 total += reducer_buffer_size;
482 put_node_memory_boundary(node, &total,
"node_log_reducer_buffers_boundary", reset_boundaries);
487 put_node_memory_boundary(node, &total,
"volatile_pool_boundary", reset_boundaries);
// Sanity check mirroring calculate_node_memory_size, then optional mprotect
// of the boundary pages.
491 std::cerr <<
"[FOEDUS] node memory size doesn't match. bug?"
493 <<
", expected=" << total << std::endl;
499 boundary->acquire_protect();
ErrorStack load_from_string(const std::string &xml)
Load the content of this object from the given XML string.
uint32_t protected_boundaries_count_
To be a POD, we avoid vector and instead uses a fix-sized array.
ErrorStack allocate_shared_memories(uint64_t upid, Eid eid, const EngineOptions &options)
Master process creates shared memories by calling this method.
void save_to_stream(std::ostream *ptr) const
Invokes save() and directs the resulting XML text to the given stream.
0x0C02 : "SOC : Failed to attach a shared memory." .
char * options_xml_
The xml itself.
A 4kb dummy data placed between separate memory regions so that we can check if/where a bogus memory ...
void change_master_status(MasterEngineStatus::StatusCode new_status)
#define ERROR_STACK(e)
Instantiates ErrorStack with the given foedus::error_code, creating an error stack with the current f...
storage::StorageId * storage_name_sort_memory_
This memory stores the ID of storages sorted by their names.
uint32_t StorageId
Unique ID for storage.
uint64_t options_xml_length_
The beginning of global memory is an XML-serialized EngineOption.
Root package of FOEDUS (Fast Optimistic Engine for Data Unification Services).
void * partitioner_data_
Data block to place detailed information of partitioners.
proc::LocalProcId * proc_name_sort_memory_
This memory stores the ID of procedures sorted by their names.
log::LogManagerControlBlock * log_manager_memory_
Tiny memory for log manager.
StatusCode
These statuses represent each step described in SocManager comment.
log::LoggerControlBlock ** logger_memories_
Status and synchronization mechanism for loggers on this node.
void * volatile_page_pool_
By far the largest memory for volatile page pool on this node.
Shared data of ThreadPimpl.
void deallocate_shared_memories()
Detaches and releases the shared memories.
void change_status_atomic(StatusCode new_status)
Update the value of status_code_ with fence.
char * get_block() const
Returns the memory block.
void change_status_atomic(StatusCode new_status)
Update the value of status_code_ with fence.
std::string get_self_path(uint64_t upid, Eid eid)
uint64_t align_4kb(uint64_t value)
Brings error stacktrace information as return value of functions.
Reader-writer (RW) MCS lock classes.
void * user_memory_
This 'user memory' can be used for arbitrary purposes by the user to communicate between SOCs...
StatusCode read_status_atomic() const
Read status_code_ with fence.
Same as GlobalMemoryAnchors except this is for node_memories_.
void mark_for_release()
Marks shared memories as being removed so that it will be reclaimed when all processes detach it...
Part of NodeMemoryAnchors for each thread.
uint64_t align_2mb(uint64_t value)
log::MetaLogControlBlock * meta_logger_memory_
Tiny memory for metadata logger.
bool rigorous_memory_boundary_check_
Whether to use mprotect() for memory boundaries to detect bogus memory accesses.
uint32_t max_storages_
Maximum number of storages in this database.
ThreadLocalOrdinal thread_count_per_group_
Number of Thread in each ThreadGroup.
storage::StorageControlBlock * storage_memories_
Status of each storage instance is stored in this shared memory.
3 << 19 is for FixedSavepoint.
Represents memory shared between processes.
proc::ProcManagerControlBlock * proc_manager_memory_
ProcManagers's status and its synchronization mechanism on this node.
storage::StorageManagerControlBlock * storage_manager_memory_
Tiny memory for storage manager.
uint32_t partitioner_data_memory_mb_
Size in MB of a shared memory buffer allocated for all partitioners during log gleaning.
uint32_t protected_boundaries_count_
To be a POD, we avoid vector and instead uses a fix-sized array.
memory::MemoryOptions memory_
storage::PartitionerMetadata * partitioner_metadata_
Tiny metadata memory for partitioners.
Pre-allocated MCS block for WW-locks.
storage::StorageOptions storage_
ErrorStack attach_shared_memories(uint64_t master_upid, Eid master_eid, SocId my_soc_id, EngineOptions *options)
Child processes (emulated or not) set a reference to shared memory and receive the EngineOption value...
static uint64_t calculate_global_memory_size(uint64_t xml_size, const EngineOptions &options)
snapshot::SnapshotOptions snapshot_
Pre-allocated MCS block for extended version of RW-locks.
Shared data for LogReducer.
thread::ThreadControlBlock * thread_memory_
Status and synchronization mechanism for impersonation of this thread.
Just a marker to denote that the memory region represents a data page.
std::pair< ProcName, Proc > ProcAndName
Set of option values given to the engine at start-up.
snapshot::LogReducerControlBlock * log_reducer_memory_
Tiny control memory for LogReducer in this node.
Current status of a child SOC engine.
static uint64_t calculate_node_memory_size(const EngineOptions &options)
void * log_reducer_buffers_[2]
Actual buffers for LogReducer.
std::string get_master_path(uint64_t master_upid, Eid master_eid)
uint16_t group_count_
Number of ThreadGroup in the engine.
xct::XctManagerControlBlock * xct_manager_memory_
Tiny memory for xct manager.
void attach(const std::string &meta_path, bool use_hugepages)
Attach an already-allocated shared memory so that this object points to the memory.
snapshot::SnapshotManagerControlBlock * snapshot_manager_memory_
Tiny memory for snapshot manager.
uint32_t log_reducer_buffer_mb_
The size in MB of a buffer to store log entries in reducer (partition).
storage::Page * log_reducer_root_info_pages_
This is the 'output' of the reducer in this node.
Shared data in PagePoolPimpl.
uint16_t SocId
Represents an ID of an SOC, or NUMA node.
ThreadMemoryAnchors * thread_anchors_
Anchors for each thread.
void assert_boundary() const
Called at shutdown to check whether these boundaries were not accessed.
thread::ThreadOptions thread_
#define CHECK_ERROR(x)
This macro calls x and checks its returned value.
uint32_t page_pool_size_mb_per_node_
Size of the page pool in MB per each NUMA node.
proc::ProcAndName * proc_memory_
Procedure list on this node.
const ErrorStack kRetOk
Normal return value for no-error case.
MasterEngineStatus * master_status_memory_
This tiny piece of memory contains the current status of the master engine and its synchronization me...
This small control block is used to synchronize the access to the array.
void allocate_arrays(const EngineOptions &options)
ChildEngineStatus * child_status_memory_
This tiny piece of memory contains the current status of the child engine on this node...
savepoint::SavepointManagerControlBlock * savepoint_manager_memory_
Tiny memory for savepoint manager.
uint32_t LocalProcId
Represents a locally-unique ID of a procedure in one SOC.
uint64_t Eid
An Engine ID to differentiate two Engine objects instantiated in the same process.
uint32_t max_proc_count_
Maximum number of system/user procedures.
assorted::ProtectedBoundary * protected_boundaries_[kMaxBoundaries]
sanity check boundaries to detect bogus memory accesses that overrun a memory region ...
void change_child_status(SocId node, ChildEngineStatus::StatusCode new_status)
#define ASSERT_ND(x)
A warning-free wrapper macro of assert() that has no performance effect in release mode even when 'x'...
ErrorCode release_protect()
Removes all access restrictions via mprotect().
void mark_for_release()
Marks the shared memory as being removed so that it will be reclaimed when all processes detach it...
restart::RestartManagerControlBlock * restart_manager_memory_
Tiny memory for restart manager.
bool rigorous_page_boundary_check_
Whether to use mprotect() for page boundaries to detect bogus memory accesses.
bool is_null() const
Returns if this object doesn't hold a valid memory block.
bool protected_boundaries_needs_release_
whether we have invoked mprotect on them
StatusCode read_status_atomic() const
Read status_code_ with fence.
memory::PagePoolControlBlock * volatile_pool_status_
PagePool's status and its synchronization mechanism for the volatile pool on this node...
uint64_t shared_user_memory_size_kb_
As part of the global shared memory, we reserve this size of 'user memory' that can be used for arbit...
ErrorStack alloc(const std::string &meta_path, uint64_t size, int numa_node, bool use_hugepages)
Newly allocate a shared memory of given size on given NUMA node.
bool protected_boundaries_needs_release_
whether we have invoked mprotect on them
ChildEngineStatus::StatusCode get_child_status(SocId node) const
assorted::ProtectedBoundary * protected_boundaries_[kMaxBoundaries]
sanity check boundaries to detect bogus memory accesses that overrun a memory region ...
const uint16_t kMaxSocs
Maximum number of SOCs.
void release_block()
Releases the memory block IF this process has an ownership.
StatusCode
These statuses represent each step described in SocManager comment.
bool is_error() const
Returns if this return code is not kErrorCodeOk.
Master engine has just started.
The child engine observed some unrecoverable error and has exit.
uint16_t loggers_per_node_
Number of loggers per NUMA node.
MasterEngineStatus::StatusCode get_master_status() const