docs/master/context_8cpp_source.html

 /*******************************************************************************
  * thrill/api/context.cpp
  *
  * Part of Project Thrill - http://project-thrill.org
  *
  * Copyright (C) 2015 Alexander Noe <[email protected]>
  * Copyright (C) 2015 Timo Bingmann <[email protected]>
  *
  * All rights reserved. Published under the BSD-2 license in the LICENSE file.
  ******************************************************************************/

 #include <thrill/api/context.hpp>

 #include <thrill/api/dia_base.hpp>
 #include <thrill/common/linux_proc_stats.hpp>
 #include <thrill/common/logger.hpp>
 #include <thrill/common/math.hpp>
 #include <thrill/common/porting.hpp>
 #include <thrill/common/profile_thread.hpp>
 #include <thrill/common/string.hpp>
 #include <thrill/common/system_exception.hpp>
 #include <thrill/vfs/file_io.hpp>

 #include <foxxll/io/iostats.hpp>
 #include <foxxll/mng/config.hpp>
 #include <tlx/math/abs_diff.hpp>
 #include <tlx/port/setenv.hpp>
 #include <tlx/string/format_si_iec_units.hpp>
 #include <tlx/string/parse_si_iec_units.hpp>
 #include <tlx/string/split.hpp>

 // mock net backend is always available -tb :)
 #include <thrill/net/mock/group.hpp>

 #if THRILL_HAVE_NET_TCP
 #include <thrill/net/tcp/construct.hpp>
 #include <thrill/net/tcp/select_dispatcher.hpp>
 #endif

 #if THRILL_HAVE_NET_MPI
 #include <thrill/net/mpi/dispatcher.hpp>
 #include <thrill/net/mpi/group.hpp>
 #endif

 #if THRILL_HAVE_NET_IB
 #include <thrill/net/ib/group.hpp>
 #endif

 #if __linux__

 // linux-specific process control
 #include <sys/prctl.h>

 // for calling getrlimit() to determine memory limit
 #include <sys/resource.h>
 #include <sys/time.h>

 #endif

 #if __APPLE__

 // for sysctl()
 #include <sys/sysctl.h>
 #include <sys/types.h>

 #endif

 #if defined(_MSC_VER)

 // for detecting amount of physical memory
 #include <windows.h>

 #endif

 #include <algorithm>
 #include <csignal>
 #include <iostream>
 #include <memory>
 #include <string>
 #include <thread>
 #include <tuple>
 #include <utility>
 #include <vector>

 namespace thrill {
 namespace api {

 /******************************************************************************/
 // Generic Network Construction

 //! Generic network constructor for net backends supporting loopback tests.
 template <typename NetGroup>
 static inline
 std::vector<std::unique_ptr<HostContext> >
 ConstructLoopbackHostContexts(
     const MemoryConfig& mem_config,
     size_t num_hosts, size_t workers_per_host) {

     static constexpr size_t kGroupCount = net::Manager::kGroupCount;

     // construct three full mesh loopback cliques, deliver net::Groups.
     std::array<std::vector<std::unique_ptr<NetGroup> >, kGroupCount> group;

     for (size_t g = 0; g < kGroupCount; ++g) {
         group[g] = NetGroup::ConstructLoopbackMesh(num_hosts);
     }

     std::vector<std::unique_ptr<net::DispatcherThread> > dispatcher;
     for (size_t h = 0; h < num_hosts; ++h) {
         dispatcher.emplace_back(
             std::make_unique<net::DispatcherThread>(
                 std::make_unique<typename NetGroup::Dispatcher>(), h));
     }

     // construct host context

     std::vector<std::unique_ptr<HostContext> > host_context;

     for (size_t h = 0; h < num_hosts; h++) {
         std::array<net::GroupPtr, kGroupCount> host_group = {
             { std::move(group[0][h]), std::move(group[1][h]) }
         };

         host_context.emplace_back(
             std::make_unique<HostContext>(
                 h, mem_config, std::move(dispatcher[h]),
                 std::move(host_group), workers_per_host));
     }

     return host_context;
 }

 //! Generic runner for backends supporting loopback tests.
 template <typename NetGroup>
 static inline void
 RunLoopbackThreads(
     const MemoryConfig& mem_config,
     size_t num_hosts, size_t workers_per_host, size_t core_offset,
     const std::function<void(Context&)>& job_startpoint) {

     MemoryConfig host_mem_config = mem_config.divide(num_hosts);
     mem_config.print(workers_per_host);

     // construct a mock network of hosts
     typename NetGroup::Dispatcher dispatcher;

     std::vector<std::unique_ptr<HostContext> > host_contexts =
         ConstructLoopbackHostContexts<NetGroup>(
             host_mem_config, num_hosts, workers_per_host);

     // launch thread for each of the workers on this host.
     std::vector<std::thread> threads(num_hosts * workers_per_host);

     for (size_t host = 0; host < num_hosts; ++host) {
         std::string log_prefix = "host " + std::to_string(host);
         for (size_t worker = 0; worker < workers_per_host; ++worker) {
             size_t id = host * workers_per_host + worker;
             threads[id] = common::CreateThread(
                 [&host_contexts, &job_startpoint, host, worker, log_prefix] {
                     Context ctx(*host_contexts[host], worker);
                     common::NameThisThread(
                         log_prefix + " worker " + std::to_string(worker));

                     ctx.Launch(job_startpoint);
                 });
             common::SetCpuAffinity(threads[id], core_offset + id);
         }
     }

     // join worker threads
     for (size_t i = 0; i < num_hosts * workers_per_host; i++) {
         threads[i].join();
     }
 }

 /******************************************************************************/
 // Other Configuration Initializations

 static inline bool SetupBlockSize() {

     const char* env_block_size = getenv("THRILL_BLOCK_SIZE");
     if (env_block_size == nullptr || *env_block_size == 0) return true;

     char* endptr;
     data::default_block_size = std::strtoul(env_block_size, &endptr, 10);

     if (endptr == nullptr || *endptr != 0 || data::default_block_size == 0) {
         std::cerr << "Thrill: environment variable"
                   << " THRILL_BLOCK_SIZE=" << env_block_size
                   << " is not a valid number."
                   << std::endl;
         return false;
     }

     data::start_block_size = data::default_block_size;

     std::cerr << "Thrill: setting default_block_size = "
               << data::default_block_size
               << std::endl;

     return true;
 }

 static inline size_t FindWorkersPerHost(
     const char*& str_workers_per_host, const char*& env_workers_per_host) {

     char* endptr;

     // first check THRILL_WORKERS_PER_HOST

     str_workers_per_host = "THRILL_WORKERS_PER_HOST";
     env_workers_per_host = getenv(str_workers_per_host);

     if (env_workers_per_host && *env_workers_per_host) {
         size_t result = std::strtoul(env_workers_per_host, &endptr, 10);
         if (!endptr || *endptr != 0 || result == 0) {
             std::cerr << "Thrill: environment variable"
                       << ' ' << str_workers_per_host
                       << '=' << env_workers_per_host
                       << " is not a valid number of workers per host."
                       << std::endl;
             return 0;
         }
         else {
             return result;
         }
     }

     // second check: look for OMP_NUM_THREADS

     str_workers_per_host = "OMP_NUM_THREADS";
     env_workers_per_host = getenv(str_workers_per_host);

     if (env_workers_per_host && *env_workers_per_host) {
         size_t result = std::strtoul(env_workers_per_host, &endptr, 10);
         if (!endptr || *endptr != 0 || result == 0) {
             std::cerr << "Thrill: environment variable"
                       << ' ' << str_workers_per_host
                       << '=' << env_workers_per_host
                       << " is not a valid number of workers per host."
                       << std::endl;
             // fall through, try next variable
         }
         else {
             return result;
         }
     }

     // third check: look for SLURM_CPUS_ON_NODE

     str_workers_per_host = "SLURM_CPUS_ON_NODE";
     env_workers_per_host = getenv(str_workers_per_host);

     if (env_workers_per_host && *env_workers_per_host) {
         size_t result = std::strtoul(env_workers_per_host, &endptr, 10);
         if (!endptr || *endptr != 0 || result == 0) {
             std::cerr << "Thrill: environment variable"
                       << ' ' << str_workers_per_host
                       << '=' << env_workers_per_host
                       << " is not a valid number of workers per host."
                       << std::endl;
             // fall through, try next variable
         }
         else {
             return result;
         }
     }

     // last check: return std::thread::hardware_concurrency()

     return std::thread::hardware_concurrency();
 }

 static inline bool Initialize() {

     if (!SetupBlockSize()) return false;

     vfs::Initialize();

     return true;
 }

 static inline bool Deinitialize() {

     vfs::Deinitialize();

     return true;
 }

 /******************************************************************************/
 // Constructions using TestGroup (either mock or tcp-loopback) for local testing

 #if defined(_MSC_VER)
 using TestGroup = net::mock::Group;
 #else
 using TestGroup = net::tcp::Group;
 #endif

 void RunLocalMock(const MemoryConfig& mem_config,
                   size_t num_hosts, size_t workers_per_host,
                   const std::function<void(Context&)>& job_startpoint) {

     return RunLoopbackThreads<TestGroup>(
         mem_config, num_hosts, workers_per_host, 0, job_startpoint);
 }

 std::vector<std::unique_ptr<HostContext> >
 HostContext::ConstructLoopback(size_t num_hosts, size_t workers_per_host) {

     // set fixed amount of RAM for testing
     MemoryConfig mem_config;
     mem_config.setup(4 * 1024 * 1024 * 1024llu);
     mem_config.verbose_ = false;

     return ConstructLoopbackHostContexts<TestGroup>(
         mem_config, num_hosts, workers_per_host);
 }

 void RunLocalTests(const std::function<void(Context&)>& job_startpoint) {
     // set fixed amount of RAM for testing
     RunLocalTests(4 * 1024 * 1024 * 1024llu, job_startpoint);
 }

 void RunLocalTests(
     size_t ram, const std::function<void(Context&)>& job_startpoint) {

     // discard json log
     tlx::setenv("THRILL_LOG", "", /* overwrite */ 1);

     // set fixed amount of RAM for testing, disable /proc profiler
     MemoryConfig mem_config;
     mem_config.verbose_ = false;
     mem_config.enable_proc_profiler_ = false;
     mem_config.setup(ram);

     static constexpr size_t num_hosts_list[] = { 1, 2, 5, 8 };
     static constexpr size_t num_workers_list[] = { 1, 3 };

     size_t max_mock_workers = 1000000;

     const char* env_max_mock_workers = getenv("THRILL_MAX_MOCK_WORKERS");
     if (env_max_mock_workers && *env_max_mock_workers) {
         // parse envvar only if it exists.
         char* endptr;
         max_mock_workers = std::strtoul(env_max_mock_workers, &endptr, 10);

         if (!endptr || *endptr != 0 || max_mock_workers == 0) {
             std::cerr << "Thrill: environment variable"
                       << " THRILL_MAX_MOCK_WORKERS=" << env_max_mock_workers
                       << " is not a valid maximum number of mock hosts."
                       << std::endl;
             return;
         }
     }

     for (const size_t& num_hosts : num_hosts_list) {
         for (const size_t& workers_per_host : num_workers_list) {
             if (num_hosts * workers_per_host > max_mock_workers) {
                 std::cerr << "Thrill: skipping test with "
                           << num_hosts * workers_per_host
                           << " workers > max workers " << max_mock_workers
                           << std::endl;
                 continue;
             }

             LOG0 << "Thrill: running local test with "
                  << num_hosts << " hosts and " << workers_per_host
                  << " workers per host";

             RunLocalMock(mem_config, num_hosts, workers_per_host,
                          job_startpoint);
         }
     }
 }

 void RunLocalSameThread(const std::function<void(Context&)>& job_startpoint) {

     size_t my_host_rank = 0;
     size_t workers_per_host = 1;
     size_t num_hosts = 1;
     static constexpr size_t kGroupCount = net::Manager::kGroupCount;

     // set fixed amount of RAM for testing
     MemoryConfig mem_config;
     mem_config.verbose_ = false;
     mem_config.setup(4 * 1024 * 1024 * 1024llu);
     mem_config.print(workers_per_host);

     // construct two full mesh connection cliques, deliver net::tcp::Groups.
     std::array<std::vector<std::unique_ptr<TestGroup> >, kGroupCount> group;

     for (size_t g = 0; g < kGroupCount; ++g) {
         group[g] = TestGroup::ConstructLoopbackMesh(num_hosts);
     }

     std::array<net::GroupPtr, kGroupCount> host_group = {
         { std::move(group[0][0]), std::move(group[1][0]) }
     };

     auto dispatcher = std::make_unique<net::DispatcherThread>(
         std::make_unique<TestGroup::Dispatcher>(), my_host_rank);

     HostContext host_context(
         0, mem_config,
         std::move(dispatcher), std::move(host_group), workers_per_host);

     Context ctx(host_context, 0);
     common::NameThisThread("worker " + std::to_string(my_host_rank));

     job_startpoint(ctx);
 }

 /******************************************************************************/
 // Run() Variants for Different Net Backends

 //! Run() implementation which uses a loopback net backend ("mock" or "tcp").
 template <typename NetGroup>
 static inline
 int RunBackendLoopback(
     const char* backend, const std::function<void(Context&)>& job_startpoint) {

     char* endptr;

     // determine number of loopback hosts

     size_t num_hosts = 2;

     const char* env_local = getenv("THRILL_LOCAL");
     if (env_local && *env_local) {
         // parse envvar only if it exists.
         num_hosts = std::strtoul(env_local, &endptr, 10);

         if (!endptr || *endptr != 0 || num_hosts == 0) {
             std::cerr << "Thrill: environment variable"
                       << " THRILL_LOCAL=" << env_local
                       << " is not a valid number of local loopback hosts."
                       << std::endl;
             return -1;
         }
     }

     // determine number of threads per loopback host

     const char* str_workers_per_host;
     const char* env_workers_per_host;

     size_t workers_per_host = FindWorkersPerHost(
         str_workers_per_host, env_workers_per_host);

     if (workers_per_host == 0)
         return -1;

     // core offset for pinning

     const char* env_core_offset = getenv("THRILL_CORE_OFFSET");
     size_t core_offset = 0;
     if (env_core_offset && *env_core_offset) {
         core_offset = std::strtoul(env_core_offset, &endptr, 10);

         size_t last_core = core_offset + num_hosts * workers_per_host;
         if (!endptr || *endptr != 0 ||
             last_core > std::thread::hardware_concurrency())
         {
             std::cerr << "Thrill: environment variable"
                       << " THRILL_CORE_OFFSET=" << env_core_offset
                       << " is not a valid number of cores to skip for pinning."
                       << std::endl;
             return -1;
         }
     }

     // detect memory config

     MemoryConfig mem_config;
     if (mem_config.setup_detect() < 0) return -1;
     mem_config.print(workers_per_host);

     // okay, configuration is good.

     std::cerr << "Thrill: running locally with " << num_hosts
               << " test hosts and " << workers_per_host << " workers per host"
               << " in a local " << backend << " network." << std::endl;

     if (!Initialize()) return -1;

     RunLoopbackThreads<NetGroup>(
         mem_config, num_hosts, workers_per_host, core_offset, job_startpoint);

     if (!Deinitialize()) return -1;

     return 0;
 }

 #if THRILL_HAVE_NET_TCP
 static inline
 int RunBackendTcp(const std::function<void(Context&)>& job_startpoint) {

     char* endptr;

     // select environment variables

     const char* str_rank = "THRILL_RANK";
     const char* env_rank = getenv(str_rank);

     if (env_rank == nullptr) {
         // take SLURM_PROCID if THRILL_RANK is not set
         str_rank = "SLURM_PROCID";
         env_rank = getenv(str_rank);
     }

     const char* env_hostlist = getenv("THRILL_HOSTLIST");

     // parse environment variables

     size_t my_host_rank = 0;

     if (env_rank != nullptr && *env_rank != 0) {
         my_host_rank = std::strtoul(env_rank, &endptr, 10);

         if (endptr == nullptr || *endptr != 0) {
             std::cerr << "Thrill: environment variable "
                       << str_rank << '=' << env_rank
                       << " is not a valid number."
                       << std::endl;
             return -1;
         }
     }
     else {
         std::cerr << "Thrill: environment variable THRILL_RANK"
                   << " is required for tcp network backend."
                   << std::endl;
         return -1;
     }

     std::vector<std::string> hostlist;

     if (env_hostlist != nullptr && *env_hostlist != 0) {
         // first try to split by spaces, then by commas
         std::vector<std::string> list = tlx::split(' ', env_hostlist);

         if (list.size() == 1) {
             tlx::split(&list, ',', env_hostlist);
         }

         for (const std::string& host : list) {
             // skip empty splits
             if (host.empty()) continue;

             if (host.find(':') == std::string::npos) {
                 std::cerr << "Thrill: invalid address \"" << host << "\""
                           << "in THRILL_HOSTLIST. It must contain a port number."
                           << std::endl;
                 return -1;
             }

             hostlist.push_back(host);
         }

         if (my_host_rank >= hostlist.size()) {
             std::cerr << "Thrill: endpoint list (" << list.size() << " entries) "
                       << "does not include my host_rank (" << my_host_rank << ")"
                       << std::endl;
             return -1;
         }
     }
     else {
         std::cerr << "Thrill: environment variable THRILL_HOSTLIST"
                   << " is required for tcp network backend."
                   << std::endl;
         return -1;
     }

     // determine number of local worker threads per process

     const char* str_workers_per_host;
     const char* env_workers_per_host;

     size_t workers_per_host = FindWorkersPerHost(
         str_workers_per_host, env_workers_per_host);

     if (workers_per_host == 0)
         return -1;

     // detect memory config

     MemoryConfig mem_config;
     if (mem_config.setup_detect() < 0) return -1;
     mem_config.print(workers_per_host);

     // okay, configuration is good.

     std::cerr << "Thrill: running in tcp network with " << hostlist.size()
               << " hosts and " << workers_per_host << " workers per host"
               << " with " << common::GetHostname()
               << " as rank " << my_host_rank << " and endpoints";
     for (const std::string& ep : hostlist)
         std::cerr << ' ' << ep;
     std::cerr << std::endl;

     if (!Initialize()) return -1;

     static constexpr size_t kGroupCount = net::Manager::kGroupCount;

     // construct three TCP network groups
     auto select_dispatcher = std::make_unique<net::tcp::SelectDispatcher>();

     std::array<std::unique_ptr<net::tcp::Group>, kGroupCount> groups;
     net::tcp::Construct(
         *select_dispatcher, my_host_rank, hostlist,
         groups.data(), net::Manager::kGroupCount);

     std::array<net::GroupPtr, kGroupCount> host_groups = {
         { std::move(groups[0]), std::move(groups[1]) }
     };

     // construct HostContext

     auto dispatcher = std::make_unique<net::DispatcherThread>(
         std::move(select_dispatcher), my_host_rank);

     HostContext host_context(
         0, mem_config,
         std::move(dispatcher), std::move(host_groups), workers_per_host);

     std::vector<std::thread> threads(workers_per_host);

     for (size_t worker = 0; worker < workers_per_host; worker++) {
         threads[worker] = common::CreateThread(
             [&host_context, &job_startpoint, worker] {
                 Context ctx(host_context, worker);
                 common::NameThisThread("worker " + std::to_string(worker));

                 ctx.Launch(job_startpoint);
             });
         common::SetCpuAffinity(threads[worker], worker);
     }

     // join worker threads
     for (size_t i = 0; i < workers_per_host; i++) {
         threads[i].join();
     }

     if (!Deinitialize()) return -1;

     return 0;
 }
 #endif

 #if THRILL_HAVE_NET_MPI
 static inline
 int RunBackendMpi(const std::function<void(Context&)>& job_startpoint) {

     // determine number of local worker threads per MPI process

     const char* str_workers_per_host;
     const char* env_workers_per_host;

     size_t workers_per_host = FindWorkersPerHost(
         str_workers_per_host, env_workers_per_host);

     if (workers_per_host == 0)
         return -1;

     // reserve one thread for MPI net::Dispatcher which runs a busy-waiting loop

     if (workers_per_host == 1) {
         std::cerr << "Thrill: environment variable"
                   << ' ' << str_workers_per_host
                   << '=' << env_workers_per_host
                   << " is not recommended, as one thread is used exclusively"
                   << " for MPI communication."
                   << std::endl;
     }
     else {
         --workers_per_host;
     }

     // detect memory config

     MemoryConfig mem_config;
     if (mem_config.setup_detect() < 0) return -1;
     mem_config.print(workers_per_host);

     // okay, configuration is good.

     size_t num_hosts = net::mpi::NumMpiProcesses();
     size_t mpi_rank = net::mpi::MpiRank();
     std::string hostname = common::GetHostname();

     std::cerr << "Thrill: running in MPI network with " << num_hosts
               << " hosts and " << workers_per_host << "+1 workers per host"
               << " with " << hostname << " as rank " << mpi_rank << "."
               << std::endl;

     if (!Initialize()) return -1;

     static constexpr size_t kGroupCount = net::Manager::kGroupCount;

     // construct three MPI network groups
     auto dispatcher = std::make_unique<net::DispatcherThread>(
         std::make_unique<net::mpi::Dispatcher>(num_hosts), mpi_rank);

     std::array<std::unique_ptr<net::mpi::Group>, kGroupCount> groups;
     net::mpi::Construct(num_hosts, *dispatcher, groups.data(), kGroupCount);

     std::array<net::GroupPtr, kGroupCount> host_groups = {
         { std::move(groups[0]), std::move(groups[1]) }
     };

     // construct HostContext
     HostContext host_context(
         0, mem_config,
         std::move(dispatcher), std::move(host_groups), workers_per_host);

     // launch worker threads
     std::vector<std::thread> threads(workers_per_host);

     for (size_t worker = 0; worker < workers_per_host; worker++) {
         threads[worker] = common::CreateThread(
             [&host_context, &job_startpoint, worker] {
                 Context ctx(host_context, worker);
                 common::NameThisThread("host " + std::to_string(ctx.host_rank())
                                        + " worker " + std::to_string(worker));

                 ctx.Launch(job_startpoint);
             });
         common::SetCpuAffinity(threads[worker], worker);
     }

     // join worker threads
     for (size_t i = 0; i < workers_per_host; i++) {
         threads[i].join();
     }

     if (!Deinitialize()) return -1;

     return 0;
 }
 #endif

 #if THRILL_HAVE_NET_IB
 static inline
 int RunBackendIb(const std::function<void(Context&)>& job_startpoint) {

     // determine number of local worker threads per IB/MPI process

     const char* str_workers_per_host;
     const char* env_workers_per_host;

     size_t workers_per_host = FindWorkersPerHost(
         str_workers_per_host, env_workers_per_host);

     if (workers_per_host == 0)
         return -1;

     // detect memory config

     MemoryConfig mem_config;
     if (mem_config.setup_detect() < 0) return -1;
     mem_config.print(workers_per_host);

     // okay, configuration is good.

     size_t num_hosts = net::ib::NumMpiProcesses();
     size_t mpi_rank = net::ib::MpiRank();

     std::cerr << "Thrill: running in IB/MPI network with " << num_hosts
               << " hosts and " << workers_per_host << " workers per host"
               << " with " << common::GetHostname()
               << " as rank " << mpi_rank << "."
               << std::endl;

     if (!Initialize()) return -1;

     static constexpr size_t kGroupCount = net::Manager::kGroupCount;

     // construct two MPI network groups
     std::array<std::unique_ptr<net::ib::Group>, kGroupCount> groups;
     net::ib::Construct(num_hosts, groups.data(), kGroupCount);

     std::array<net::GroupPtr, kGroupCount> host_groups = {
         { std::move(groups[0]), std::move(groups[1]) }
     };

     // construct HostContext
     HostContext host_context(
         0, mem_config, std::move(host_groups), workers_per_host);

     // launch worker threads
     std::vector<std::thread> threads(workers_per_host);

     for (size_t worker = 0; worker < workers_per_host; worker++) {
         threads[worker] = common::CreateThread(
             [&host_context, &job_startpoint, worker] {
                 Context ctx(host_context, worker);
                 common::NameThisThread("host " + std::to_string(ctx.host_rank())
                                        + " worker " + std::to_string(worker));

                 ctx.Launch(job_startpoint);
             });
         common::SetCpuAffinity(threads[worker], worker);
     }

     // join worker threads
     for (size_t i = 0; i < workers_per_host; i++) {
         threads[i].join();
     }

     if (!Deinitialize()) return -1;

     return 0;
 }
 #endif

 int RunNotSupported(const char* env_net) {
     std::cerr << "Thrill: network backend " << env_net
               << " is not supported by this binary." << std::endl;
     return -1;
 }

 static inline
 const char * DetectNetBackend() {
     // detect openmpi and intel mpi run, add others as well.
     if (getenv("OMPI_COMM_WORLD_SIZE") != nullptr ||
         getenv("I_MPI_INFO_NP") != nullptr) {
 #if THRILL_HAVE_NET_IB
         return "ib";
 #elif THRILL_HAVE_NET_MPI
         return "mpi";
 #else
         std::cerr << "Thrill: MPI environment detected, but network backend mpi"
                   << " is not supported by this binary." << std::endl;
         return nullptr;
 #endif
     }
 #if defined(_MSC_VER)
     return "mock";
 #else
     const char* env_rank = getenv("THRILL_RANK");
     const char* env_hostlist = getenv("THRILL_HOSTLIST");

     if (env_rank != nullptr || env_hostlist != nullptr)
         return "tcp";
     else
         return "local";
 #endif
 }

 int RunCheckDieWithParent() {

     const char* env_die_with_parent = getenv("THRILL_DIE_WITH_PARENT");
     if (env_die_with_parent == nullptr || *env_die_with_parent == 0) return 0;

     char* endptr;

     long die_with_parent = std::strtol(env_die_with_parent, &endptr, 10);
     if (endptr == nullptr || *endptr != 0 ||
         (die_with_parent != 0 && die_with_parent != 1)) {
         std::cerr << "Thrill: environment variable"
                   << " THRILL_DIE_WITH_PARENT=" << env_die_with_parent
                   << " is not either 0 or 1."
                   << std::endl;
         return -1;
     }

     if (die_with_parent == 0) return 0;

 #if __linux__
     if (prctl(PR_SET_PDEATHSIG, SIGTERM) != 0) // NOLINT
         throw common::ErrnoException("Error calling prctl(PR_SET_PDEATHSIG)");
     return 1;
 #else
     std::cerr << "Thrill: DIE_WITH_PARENT is not supported on this platform.\n"
               << "Please submit a patch."
               << std::endl;
     return 0;
 #endif
 }

 int RunCheckUnlinkBinary() {

     const char* env_unlink_binary = getenv("THRILL_UNLINK_BINARY");
     if (env_unlink_binary == nullptr || *env_unlink_binary == 0) return 0;

     if (unlink(env_unlink_binary) != 0) {
         throw common::ErrnoException(
                   "Error calling unlink binary \""
                   + std::string(env_unlink_binary) + "\"");
     }

     return 0;
 }

 /*----------------------------------------------------------------------------*/
 // Customized FOXXLL Disk Config

 //! config class to override foxxll's default config
 class FoxxllConfig : public foxxll::config
 {
 public:
     //! override load_default_config()
     void load_default_config() override;

     //! Returns default path of disk.
     std::string default_disk_path() override;

     //! returns the name of the default config file prefix
     std::string default_config_file_name() override;
 };

 void FoxxllConfig::load_default_config() {
     TLX_LOG1 << "foxxll: Using default disk configuration.";
     foxxll::disk_config entry1(
         default_disk_path(), 1000 * 1024 * 1024, default_disk_io_impl());
     entry1.unlink_on_open = true;
     entry1.autogrow = true;
     add_disk(entry1);
 }

 std::string FoxxllConfig::default_disk_path() {
 #if !FOXXLL_WINDOWS
     int pid = getpid();
     return "/var/tmp/thrill." + common::to_str(pid) + ".tmp";
 #else
     DWORD pid = GetCurrentProcessId();
     char* tmpstr = new char[255];
     if (GetTempPathA(255, tmpstr) == 0)
         FOXXLL_THROW_WIN_LASTERROR(resource_error, "GetTempPathA()");
     std::string result = tmpstr;
     result += "thrill." + common::to_str(pid) + ".tmp";
     delete[] tmpstr;
     return result;
 #endif
 }

 std::string FoxxllConfig::default_config_file_name() {
     return ".thrill";
 }

 void RunSetupFoxxll() {
     // install derived config instance in foxxll's singleton
     foxxll::config::create_instance<FoxxllConfig>();
 }

 /*----------------------------------------------------------------------------*/

 int Run(const std::function<void(Context&)>& job_startpoint) {

     common::NameThisThread("main");

     if (RunCheckDieWithParent() < 0)
         return -1;

     if (RunCheckUnlinkBinary() < 0)
         return -1;

     RunSetupFoxxll();

     // parse environment: THRILL_NET
     const char* env_net = getenv("THRILL_NET");

     // if no backend configured: automatically select one.
     if (env_net == nullptr || *env_net == 0) {
         env_net = DetectNetBackend();
         if (env_net == nullptr) return -1;
     }

     // run with selected backend
     if (strcmp(env_net, "mock") == 0) {
         // mock network backend
         return RunBackendLoopback<net::mock::Group>("mock", job_startpoint);
     }

     if (strcmp(env_net, "local") == 0) {
 #if THRILL_HAVE_NET_TCP
         // tcp loopback network backend
         return RunBackendLoopback<net::tcp::Group>("tcp", job_startpoint);
 #else
         return RunNotSupported(env_net);
 #endif
     }

     if (strcmp(env_net, "tcp") == 0) {
 #if THRILL_HAVE_NET_TCP
         // real tcp network backend
         return RunBackendTcp(job_startpoint);
 #else
         return RunNotSupported(env_net);
 #endif
     }

     if (strcmp(env_net, "mpi") == 0) {
 #if THRILL_HAVE_NET_MPI
         // mpi network backend
         return RunBackendMpi(job_startpoint);
 #else
         return RunNotSupported(env_net);
 #endif
     }

     if (strcmp(env_net, "ib") == 0) {
 #if THRILL_HAVE_NET_IB
         // ib/mpi network backend
         return RunBackendIb(job_startpoint);
 #else
         return RunNotSupported(env_net);
 #endif
     }

     std::cerr << "Thrill: network backend " << env_net << " is unknown."
               << std::endl;
     return -1;
 }

 /******************************************************************************/
 // MemoryConfig

 void MemoryConfig::setup(size_t ram) {
     ram_ = ram;
     apply();
 }

 int MemoryConfig::setup_detect() {

     // determine amount of physical RAM or take user's limit

     const char* env_ram = getenv("THRILL_RAM");

     if (env_ram != nullptr && *env_ram != 0) {
         uint64_t ram64;
         if (!tlx::parse_si_iec_units(env_ram, &ram64)) {
             std::cerr << "Thrill: environment variable"
                       << " THRILL_RAM=" << env_ram
                       << " is not a valid amount of RAM memory."
                       << std::endl;
             return -1;
         }
         ram_ = static_cast<size_t>(ram64);
     }
     else {
         // detect amount of physical memory on system
 #if defined(_MSC_VER)
         MEMORYSTATUSEX memstx;
         memstx.dwLength = sizeof(memstx);
         GlobalMemoryStatusEx(&memstx);

         ram_ = memstx.ullTotalPhys;
 #elif __APPLE__
         int mib[2];
         int64_t physical_memory;
         size_t length;

         // Get the physical memory size
         mib[0] = CTL_HW;
         mib[1] = HW_MEMSIZE;
         length = sizeof(physical_memory);
         sysctl(mib, 2, &physical_memory, &length, nullptr, 0);
         ram_ = static_cast<size_t>(physical_memory);
 #else
         ram_ = sysconf(_SC_PHYS_PAGES) * static_cast<size_t>(sysconf(_SC_PAGESIZE));
 #endif

 #if __linux__
         // use getrlimit() to check user limit on address space
         struct rlimit rl; // NOLINT
         if (getrlimit(RLIMIT_AS, &rl) == 0) {
             if (rl.rlim_cur != 0 && rl.rlim_cur * 3 / 4 < ram_) {
                 ram_ = rl.rlim_cur * 3 / 4;
             }
         }
         else {
             sLOG1 << "getrlimit(): " << strerror(errno);
         }
 #endif
     }

     apply();

     return 0;
 }

 void MemoryConfig::apply() {
     // divide up ram_

     ram_workers_ = ram_ / 3;
     ram_block_pool_hard_ = ram_ / 3;
     ram_block_pool_soft_ = ram_block_pool_hard_ * 9 / 10;
     ram_floating_ = ram_ - ram_block_pool_hard_ - ram_workers_;

     // set memory limit, only BlockPool is excluded from malloc tracking, as
     // only it uses bypassing allocators.
     mem::set_memory_limit_indication(ram_floating_ + ram_workers_);
 }

 MemoryConfig MemoryConfig::divide(size_t hosts) const {

     MemoryConfig mc = *this;
     mc.ram_ /= hosts;
     mc.ram_block_pool_hard_ /= hosts;
     mc.ram_block_pool_soft_ /= hosts;
     mc.ram_workers_ /= hosts;
     // free floating memory is not divided by host, as it is measured overall

     return mc;
 }

 void MemoryConfig::print(size_t workers_per_host) const {
     if (!verbose_) return;

     std::cerr
         << "Thrill: using "
         << tlx::format_iec_units(ram_) << "B RAM total,"
         << " BlockPool=" << tlx::format_iec_units(ram_block_pool_hard_) << "B,"
         << " workers="
         << tlx::format_iec_units(ram_workers_ / workers_per_host) << "B,"
         << " floating=" << tlx::format_iec_units(ram_floating_) << "B."
         << std::endl;
 }

 /******************************************************************************/
 // HostContext methods

 HostContext::HostContext(
     size_t local_host_id,
     const MemoryConfig& mem_config,
     std::unique_ptr<net::DispatcherThread> dispatcher,
     std::array<net::GroupPtr, net::Manager::kGroupCount>&& groups,
     size_t workers_per_host)
     : mem_config_(mem_config),
       base_logger_(MakeHostLogPath(groups[0]->my_host_rank())),
       logger_(&base_logger_, "host_rank", groups[0]->my_host_rank()),
       profiler_(std::make_unique<common::ProfileThread>()),
       local_host_id_(local_host_id),
       workers_per_host_(workers_per_host),
       dispatcher_(std::move(dispatcher)),
       net_manager_(std::move(groups), logger_) {

     // write command line parameters to json log
     common::LogCmdlineParams(logger_);

     if (mem_config_.enable_proc_profiler_)
         StartLinuxProcStatsProfiler(*profiler_, logger_);

     // run memory profiler only on local host 0 (especially for test runs)
     if (local_host_id == 0)
         mem::StartMemProfiler(*profiler_, logger_);
 }

 HostContext::~HostContext() {
     // stop dispatcher _before_ stopping multiplexer
     dispatcher_->Terminate();
 }

 std::string HostContext::MakeHostLogPath(size_t host_rank) {
     const char* env_log = getenv("THRILL_LOG");
     if (env_log == nullptr) {
         if (host_rank == 0 && mem_config().verbose_) {
             std::cerr << "Thrill: no THRILL_LOG was found, "
                       << "so no json log is written."
                       << std::endl;
         }
         return std::string();
     }

     std::string output = env_log;
     if (output == "" || output == "-")
         return std::string();
     if (output == "/dev/stdout")
         return output;
     if (output == "stdout")
         return "/dev/stdout";

     return output + "-host-" + std::to_string(host_rank) + ".json";
 }

 /******************************************************************************/
 // Context methods

 Context::Context(HostContext& host_context, size_t local_worker_id)
     : local_host_id_(host_context.local_host_id()),
       local_worker_id_(local_worker_id),
       workers_per_host_(host_context.workers_per_host()),
       mem_limit_(host_context.worker_mem_limit()),
       mem_config_(host_context.mem_config()),
       mem_manager_(host_context.mem_manager()),
       net_manager_(host_context.net_manager()),
       flow_manager_(host_context.flow_manager()),
       block_pool_(host_context.block_pool()),
       multiplexer_(host_context.data_multiplexer()),
       rng_(std::random_device { }
            () + (local_worker_id_ << 16)),
       base_logger_(&host_context.base_logger_) {
     assert(local_worker_id < workers_per_host());
 }

 data::File Context::GetFile(DIABase* dia) {
     return GetFile(dia != nullptr ? dia->dia_id() : 0);
 }

 data::FilePtr Context::GetFilePtr(size_t dia_id) {
     return tlx::make_counting<data::File>(
         block_pool_, local_worker_id_, dia_id);
 }

 data::FilePtr Context::GetFilePtr(DIABase* dia) {
     return GetFilePtr(dia != nullptr ? dia->dia_id() : 0);
 }

 data::CatStreamPtr Context::GetNewCatStream(size_t dia_id) {
     return multiplexer_.GetNewCatStream(local_worker_id_, dia_id);
 }

 data::CatStreamPtr Context::GetNewCatStream(DIABase* dia) {
     return GetNewCatStream(dia != nullptr ? dia->dia_id() : 0);
 }

 data::MixStreamPtr Context::GetNewMixStream(size_t dia_id) {
     return multiplexer_.GetNewMixStream(local_worker_id_, dia_id);
 }

 data::MixStreamPtr Context::GetNewMixStream(DIABase* dia) {
     return GetNewMixStream(dia != nullptr ? dia->dia_id() : 0);
 }

 template <>
 data::CatStreamPtr Context::GetNewStream<data::CatStream>(size_t dia_id) {
     return GetNewCatStream(dia_id);
 }

 template <>
 data::MixStreamPtr Context::GetNewStream<data::MixStream>(size_t dia_id) {
     return GetNewMixStream(dia_id);
 }

 struct OverallStats {

     //! overall run time
     double runtime;

     //! maximum ByteBlock allocation on all workers
     size_t max_block_bytes;

     //! network traffic performed by net layer
     size_t net_traffic_tx, net_traffic_rx;

     //! I/O volume performed by io layer
     size_t io_volume;

     //! maximum external memory allocation
     size_t io_max_allocation;

     friend std::ostream& operator << (std::ostream& os, const OverallStats& c) {
         return os << "[OverallStats"
                   << " runtime=" << c.runtime
                   << " max_block_bytes=" << c.max_block_bytes
                   << " net_traffic_tx=" << c.net_traffic_tx
                   << " net_traffic_rx=" << c.net_traffic_rx
                   << " io_volume=" << c.io_volume
                   << " io_max_allocation=" << c.io_max_allocation
                   << "]";
     }

     OverallStats operator + (const OverallStats& b) const {
         OverallStats r;
         r.runtime = std::max(runtime, b.runtime);
         r.max_block_bytes = max_block_bytes + b.max_block_bytes;
         r.net_traffic_tx = net_traffic_tx + b.net_traffic_tx;
         r.net_traffic_rx = net_traffic_rx + b.net_traffic_rx;
         r.io_volume = io_volume + b.io_volume;
         r.io_max_allocation = std::max(io_max_allocation, b.io_max_allocation);
         return r;
     }
 };

 void Context::Launch(const std::function<void(Context&)>& job_startpoint) {
     logger_ << "class" << "Context"
             << "event" << "job-start";

     common::StatsTimerStart overall_timer;

     try {
         job_startpoint(*this);
     }
     catch (std::exception& e) {
         LOG1 << "worker " << my_rank() << " threw " << typeid(e).name();
         LOG1 << "  what(): " << e.what();

         logger_ << "class" << "Context"
                 << "event" << "job-exception"
                 << "exception" << typeid(e).name()
                 << "what" << e.what();
         throw;
     }

     logger_ << "class" << "Context"
             << "event" << "job-done"
             << "elapsed" << overall_timer;

     overall_timer.Stop();

     // collect overall statistics
     OverallStats stats;
     stats.runtime = overall_timer.SecondsDouble();

     stats.max_block_bytes =
         local_worker_id_ == 0 ? block_pool().max_total_bytes() : 0;

     stats.net_traffic_tx = local_worker_id_ == 0 ? net_manager_.Traffic().tx : 0;
     stats.net_traffic_rx = local_worker_id_ == 0 ? net_manager_.Traffic().rx : 0;

     if (local_host_id_ == 0 && local_worker_id_ == 0) {
         foxxll::stats_data io_stats(*foxxll::stats::get_instance());
         stats.io_volume = io_stats.get_read_bytes() + io_stats.get_write_bytes();
         stats.io_max_allocation =
             foxxll::block_manager::get_instance()->maximum_allocation();
     }
     else {
         stats.io_volume = 0;
         stats.io_max_allocation = 0;
     }

     LOG0 << stats;

     stats = net.Reduce(stats);

     if (my_rank() == 0) {
         using tlx::format_iec_units;

         if (stats.net_traffic_rx != stats.net_traffic_tx)
             LOG1 << "Manager::Traffic() tx/rx asymmetry = "
                  << tlx::abs_diff(stats.net_traffic_tx, stats.net_traffic_rx);

         if (mem_config().verbose_) {
             std::cerr
                 << "Thrill:"
                 << " ran " << stats.runtime << "s with max "
                 << format_iec_units(stats.max_block_bytes) << "B in DIA Blocks, "
                 << format_iec_units(stats.net_traffic_tx) << "B network traffic, "
                 << format_iec_units(stats.io_volume) << "B disk I/O, and "
                 << format_iec_units(stats.io_max_allocation) << "B max disk use."
                 << std::endl;
         }

         logger_ << "class" << "Context"
                 << "event" << "summary"
                 << "runtime" << stats.runtime
                 << "net_traffic" << stats.net_traffic_tx
                 << "io_volume" << stats.io_volume
                 << "io_max_allocation" << stats.io_max_allocation;
     }
 }

 } // namespace api
 } // namespace thrill

 /******************************************************************************/
thrill::common::CreateThread
std::thread CreateThread(Args &&... args)
create a std::thread and repeat creation if it fails
Definition: porting.hpp:44

thrill::data::Multiplexer::GetNewCatStream
CatStreamPtr GetNewCatStream(size_t local_worker_id, size_t dia_id)
Request next stream.
Definition: multiplexer.cpp:195

thrill::api::MemoryConfig::ram_
size_t ram_
total amount of physical ram detected or THRILL_RAM
Definition: context.hpp:63

thrill::api::Context::local_host_id_
size_t local_host_id_
id among all local hosts (in test program runs)
Definition: context.hpp:395

thrill::api::Context::net
net::FlowControlChannel & net
Definition: context.hpp:446

max
static uint_pair max()
return an uint_pair instance containing the largest value possible
Definition: uint_types.hpp:226

system_exception.hpp

setenv.hpp

thrill::api::Context::workers_per_host
size_t workers_per_host() const
Returns the number of workers that is hosted on each host.
Definition: context.hpp:238

thrill::data::BlockPool::max_total_bytes
size_t max_total_bytes() noexcept
Maximum total number of bytes allocated in blocks of this block pool.
Definition: block_pool.cpp:896

config.hpp

thrill::net::mock::Group
The central object of a mock network: the Group containing links to other mock Group forming the netw...
Definition: group.hpp:116

thrill::common::LogCmdlineParams
void LogCmdlineParams(JsonLogger &logger)
Definition: porting.cpp:68

porting.hpp

thrill::api::HostContext::worker_mem_limit
size_t worker_mem_limit() const
memory limit of each worker Context for local data structures
Definition: context.hpp:118

thrill::api::HostContext::HostContext
HostContext(size_t local_host_id, const MemoryConfig &mem_config, std::unique_ptr< net::DispatcherThread > dispatcher, std::array< net::GroupPtr, net::Manager::kGroupCount > &&groups, size_t workers_per_host)
constructor from existing net Groups. Used by the construction methods.
Definition: context.cpp:1123

thrill::mem::StartMemProfiler
void StartMemProfiler(common::ProfileThread &sched, common::JsonLogger &logger)
launch profiler task
Definition: malloc_tracker.cpp:383

select_dispatcher.hpp

thrill::vfs::Initialize
void Initialize()
Initialize VFS layer.
Definition: file_io.cpp:35

thrill::api::Context::net_manager_
net::Manager & net_manager_
net::Manager instance that is shared among workers
Definition: context.hpp:413

thrill::api::HostContext::MakeHostLogPath
std::string MakeHostLogPath(size_t host_rank)
create host log
Definition: context.cpp:1154

LOG1
#define LOG1
Definition: logger.hpp:28

thrill::data::default_block_size
size_t default_block_size
default size of blocks in File, Channel, BlockQueue, etc.
Definition: byte_block.cpp:25

thrill::net::tcp::Group
Collection of NetConnections to workers, allows point-to-point client communication and simple collec...
Definition: group.hpp:43

thrill::data::File
A File is an ordered sequence of Block objects for storing items.
Definition: file.hpp:56

thrill::api::Run
int Run(const std::function< void(Context &)> &job_startpoint)
Runs the given job startpoint with a Context instance.
Definition: context.cpp:947

LOG0
#define LOG0
Override default output: never or always output log.
Definition: logger.hpp:27

thrill::api::Context::mem_config
const MemoryConfig & mem_config() const
host-global memory config
Definition: context.hpp:329

string.hpp

thrill::api::HostContext::net_manager
net::Manager & net_manager()
net manager constructs communication groups to other hosts.
Definition: context.hpp:129

thrill::common::ErrnoException
An Exception which is thrown on system errors and contains errno information.
Definition: system_exception.hpp:36

foxxll::stats_data::get_read_bytes
external_size_type get_read_bytes() const
Definition: iostats.cpp:527

std
STL namespace.

dia_base.hpp

file_io.hpp

thrill::api::HostContext::block_pool
data::BlockPool & block_pool()
the block manager keeps all data blocks moving through the system.
Definition: context.hpp:139

thrill::mem::set_memory_limit_indication
void set_memory_limit_indication(ssize_t size)
Definition: malloc_tracker.cpp:292

thrill::api::HostContext::logger_
common::JsonLogger logger_
Definition: context.hpp:158

logger.hpp

foxxll::disk_config::unlink_on_open
bool unlink_on_open
unlink file immediately after opening (available on most Unix)
Definition: config.hpp:103

thrill::api::HostContext::data_multiplexer
data::Multiplexer & data_multiplexer()
data multiplexer transmits large amounts of data asynchronously.
Definition: context.hpp:142

thrill::api::MemoryConfig::divide
MemoryConfig divide(size_t hosts) const
Definition: context.cpp:1095

thrill::api::RunCheckDieWithParent
int RunCheckDieWithParent()
Check environment variable THRILL_DIE_WITH_PARENT and enable process flag: this is useful for ssh/inv...
Definition: context.cpp:849

thrill::api::Context::operator<<
friend std::ostream & operator<<(std::ostream &os, const Context &ctx)
Outputs the context as [host id]:[local worker id] to an std::ostream.
Definition: context.hpp:272

parse_si_iec_units.hpp

thrill::api::MemoryConfig::setup_detect
int setup_detect()
detect memory configuration from environment
Definition: context.cpp:1023

sLOG1
#define sLOG1
Definition: logger.hpp:38

thrill::api::Context
The Context of a job is a unique instance per worker which holds references to all underlying parts o...
Definition: context.hpp:221

context.hpp

linux_proc_stats.hpp

profile_thread.hpp

dispatcher.hpp

thrill::api::MemoryConfig
Definition: context.hpp:48

thrill::common::NameThisThread
void NameThisThread(const std::string &name)
Defines a name for the current thread, only if no name was set previously.
Definition: logger.cpp:40

thrill::api::DIABase
The DIABase is the untyped super class of DIANode.
Definition: dia_base.hpp:87

thrill::mem::to_string
static by_string to_string(int val)
convert to string
Definition: allocator_base.hpp:191

thrill::api::MemoryConfig::print
void print(size_t workers_per_host) const
Definition: context.cpp:1107

foxxll::block_manager::maximum_allocation
uint64_t maximum_allocation() const
return maximum number of bytes allocated during program run.
Definition: block_manager.cpp:133

thrill::api::Deinitialize
static bool Deinitialize()
Definition: context.cpp:283

foxxll::config
Definition: config.hpp:114

group.hpp

thrill::api::ConstructLoopbackHostContexts
static std::vector< std::unique_ptr< HostContext > > ConstructLoopbackHostContexts(const MemoryConfig &mem_config, size_t num_hosts, size_t workers_per_host)
Generic network constructor for net backends supporting loopback tests.
Definition: context.cpp:95

tlx::split
std::vector< std::string > split(char sep, const std::string &str, std::string::size_type limit)
Split the given string at each separator character into distinct substrings.
Definition: split.cpp:20

thrill::api::RunCheckUnlinkBinary
int RunCheckUnlinkBinary()
Check environment variable THRILL_UNLINK_BINARY and unlink given program path: this is useful for ssh...
Definition: context.cpp:880

thrill::api::Context::block_pool_
data::BlockPool & block_pool_
data block pool
Definition: context.hpp:419

thrill::api::RunLoopbackThreads
static void RunLoopbackThreads(const MemoryConfig &mem_config, size_t num_hosts, size_t workers_per_host, size_t core_offset, const std::function< void(Context &)> &job_startpoint)
Generic runner for backends supporting loopback tests.
Definition: context.cpp:136

thrill::api::HostContext::mem_manager
mem::Manager & mem_manager()
host-global memory manager
Definition: context.hpp:126

thrill::api::Context::GetNewCatStream
data::CatStreamPtr GetNewCatStream(size_t dia_id)
Definition: context.cpp:1209

thrill::data::start_block_size
size_t start_block_size
starting size of blocks in BlockWriter.
Definition: byte_block.cpp:24

tlx::setenv
int setenv(const char *name, const char *value, int overwrite)
setenv - change or add an environment variable Windows porting madness because setenv() is apparently...
Definition: setenv.cpp:31

thrill::api::HostContext::~HostContext
~HostContext()
destructor
Definition: context.cpp:1149

thrill::common::GetHostname
std::string GetHostname()
get hostname
Definition: porting.cpp:143

thrill::api::HostContext::base_logger_
common::JsonLogger base_logger_
base logger exclusive for this host context
Definition: context.hpp:153

foxxll::stats_data::get_write_bytes
external_size_type get_write_bytes() const
Definition: iostats.cpp:543

tlx::parse_si_iec_units
bool parse_si_iec_units(const char *str, uint64_t *out_size, char default_unit)
Parse a string like "343KB" or "44 GiB" into the corresponding size in bytes.
Definition: parse_si_iec_units.cpp:17

thrill::api::HostContext::workers_per_host
size_t workers_per_host() const
number of workers per host (all have the same).
Definition: context.hpp:115

thrill::api::RunLocalSameThread
void RunLocalSameThread(const std::function< void(Context &)> &job_startpoint)
Runs the given job_startpoint within the same thread with a test network –> run test with one host a...
Definition: context.cpp:376

thrill::api::Context::local_worker_id_
size_t local_worker_id_
number of this host context, 0..p-1, within this host
Definition: context.hpp:398

iostats.hpp

thrill::api::MemoryConfig::ram_block_pool_hard_
size_t ram_block_pool_hard_
amount of RAM dedicated to data::BlockPool – hard limit
Definition: context.hpp:66

thrill::mem::make_unique
unique_ptr< T > make_unique(Manager &manager, Args &&... args)
make_unique with Manager tracking
Definition: allocator.hpp:212

thrill::api::RunLocalMock
void RunLocalMock(const MemoryConfig &mem_config, size_t num_hosts, size_t workers_per_host, const std::function< void(Context &)> &job_startpoint)
Function to run a number of mock hosts as locally independent threads, which communicate via internal...
Definition: context.cpp:299

thrill::common::StartLinuxProcStatsProfiler
void StartLinuxProcStatsProfiler(ProfileThread &, JsonLogger &)
launch profiler task
Definition: linux_proc_stats.cpp:860

tlx::abs_diff
T abs_diff(const T &a, const T &b)
absolute difference, which also works for unsigned types
Definition: abs_diff.hpp:24

thrill::api::SetupBlockSize
static bool SetupBlockSize()
Definition: context.cpp:179

thrill::vfs::Deinitialize
void Deinitialize()
Deinitialize VFS layer.
Definition: file_io.cpp:40

thrill::api::Context::logger_
common::JsonLogger logger_
Definition: context.hpp:462

thrill::net::FlowControlChannel::Reduce
T TLX_ATTRIBUTE_WARN_UNUSED_RESULT Reduce(const T &value, size_t root=0, const BinarySumOp &sum_op=BinarySumOp())
Reduces a value of a serializable type T over all workers to the given worker, provided a certain red...
Definition: flow_control_channel.hpp:543

thrill::api::MemoryConfig::ram_workers_
size_t ram_workers_
Definition: context.hpp:73

thrill::api::RunNotSupported
int RunNotSupported(const char *env_net)
Definition: context.cpp:815

thrill::mem::string
std::basic_string< char, std::char_traits< char >, Allocator< char > > string
string with Manager tracking
Definition: allocator.hpp:220

abs_diff.hpp

split.hpp

foxxll::singleton< stats >::get_instance
static instance_pointer get_instance()
return instance or create base instance if empty
Definition: singleton.hpp:41

thrill::api::Context::local_worker_id
size_t local_worker_id() const
Definition: context.hpp:263

thrill::net::tcp::Group::ConstructLoopbackMesh
static std::vector< std::unique_ptr< Group > > ConstructLoopbackMesh(size_t num_hosts)
Construct a test network with an underlying full mesh of local loopback stream sockets for testing...
Definition: group.cpp:36

thrill::api::Context::GetFilePtr
data::FilePtr GetFilePtr(size_t dia_id)
Definition: context.cpp:1200

thrill::data::Multiplexer::GetNewMixStream
MixStreamPtr GetNewMixStream(size_t local_worker_id, size_t dia_id)
Request next stream.
Definition: multiplexer.cpp:227

thrill::api::RunLocalTests
void RunLocalTests(const std::function< void(Context &)> &job_startpoint)
Helper Function to execute RunLocalMock() tests using mock networks in test suite for many different ...
Definition: context.cpp:319

thrill::api::MemoryConfig::apply
void apply()
Definition: context.cpp:1082

thrill::net::mpi::MpiRank
size_t MpiRank()
Return the rank of this process in the MPI COMM WORLD.
Definition: group.cpp:714

tlx::CountingPtr< File >

thrill::net::Manager::Traffic
net::Traffic Traffic() const
calculate overall traffic for final stats
Definition: group.cpp:67

thrill::api::Context::my_rank
size_t my_rank() const
Global rank of this worker among all other workers in the system.
Definition: context.hpp:243

thrill::net::tcp::Construct
void Construct(SelectDispatcher &dispatcher, size_t my_rank, const std::vector< std::string > &endpoints, std::unique_ptr< Group > *groups, size_t group_count)
Definition: construct.cpp:543

thrill::api::FindWorkersPerHost
static size_t FindWorkersPerHost(const char *&str_workers_per_host, const char *&env_workers_per_host)
Definition: context.cpp:204

thrill::api::Context::Context
Context(HostContext &host_context, size_t local_worker_id)
Definition: context.cpp:1179

thrill::api::Context::GetFile
data::File GetFile(size_t dia_id)
Returns a new File object containing a sequence of local Blocks.
Definition: context.hpp:283

thrill::api::Context::GetNewMixStream
data::MixStreamPtr GetNewMixStream(size_t dia_id)
Definition: context.cpp:1217

thrill::common::to_str
static std::string to_str(const Type &t)
Definition: string.hpp:36

thrill::api::DIABase::dia_id
const size_t & dia_id() const
return unique id of DIANode subclass as stored by StatsNode
Definition: dia_base.hpp:213

math.hpp

thrill::api::HostContext::flow_manager
net::FlowControlChannelManager & flow_manager()
the flow control group is used for collective communication.
Definition: context.hpp:136

thrill::api::Context::Launch
void Launch(const std::function< void(Context &)> &job_startpoint)
method used to launch a job&#39;s main procedure. it wraps it in log output.
Definition: context.cpp:1275

thrill::api::Context::multiplexer_
data::Multiplexer & multiplexer_
data::Multiplexer instance that is shared among workers
Definition: context.hpp:422

thrill::api::MemoryConfig::ram_block_pool_soft_
size_t ram_block_pool_soft_
amount of RAM dedicated to data::BlockPool – soft limit
Definition: context.hpp:69

thrill::api::Context::host_rank
size_t host_rank() const
Definition: context.hpp:257

thrill::api::RunSetupFoxxll
void RunSetupFoxxll()
Definition: context.cpp:940

thrill::net::Manager::kGroupCount
static constexpr size_t kGroupCount
The count of net::Groups to initialize.
Definition: manager.hpp:61

thrill::api::HostContext::flow_manager_
net::FlowControlChannelManager flow_manager_
the flow control group is used for collective communication.
Definition: context.hpp:189

foxxll::disk_config
Definition: config.hpp:36

thrill::api::HostContext::mem_manager_
mem::Manager mem_manager_
host-global memory manager for internal memory only
Definition: context.hpp:173

thrill::api::HostContext
The HostContext contains all data structures shared among workers on the same host.
Definition: context.hpp:90

format_si_iec_units.hpp

thrill::api::MemoryConfig::setup
void setup(size_t ram)
setup memory size
Definition: context.cpp:1018

construct.hpp

thrill::api::RunBackendLoopback
static int RunBackendLoopback(const char *backend, const std::function< void(Context &)> &job_startpoint)
Run() implementation which uses a loopback net backend ("mock" or "tcp").
Definition: context.cpp:419

thrill::api::HostContext::local_host_id
size_t local_host_id() const
Returns local_host_id_.
Definition: context.hpp:112

TLX_LOG1
#define TLX_LOG1
Definition: core.hpp:145

thrill
Definition: action_node.hpp:21

thrill::common::StatsTimerBaseStarted
Definition: stats_timer.hpp:271

thrill::api::HostContext::ConstructLoopback
static std::vector< std::unique_ptr< HostContext > > ConstructLoopback(size_t num_hosts, size_t workers_per_host)
Construct a number of mock hosts running in this process.
Definition: context.cpp:308

thrill::api::HostContext::mem_config
MemoryConfig & mem_config()
host-global memory config
Definition: context.hpp:123

thrill::net::Traffic::rx
size_t rx
received bytes
Definition: manager.hpp:37

thrill::net::mpi::NumMpiProcesses
size_t NumMpiProcesses()
Return the number of MPI processes.
Definition: group.cpp:701

thrill::api::Initialize
static bool Initialize()
Definition: context.cpp:274

thrill::api::HostContext::mem_config_
MemoryConfig mem_config_
memory configuration
Definition: context.hpp:146

group.hpp

thrill::api::HostContext::block_pool_
data::BlockPool block_pool_
data block pool
Definition: context.hpp:194

foxxll::disk_config::autogrow
bool autogrow
autogrow file if more disk space is needed, automatically set if size == 0.
Definition: config.hpp:78

thrill::api::HostContext::profiler_
std::unique_ptr< common::ProfileThread > profiler_
thread for scheduling profiling methods for statistical output
Definition: context.hpp:161

thrill::api::MemoryConfig::enable_proc_profiler_
bool enable_proc_profiler_
enable Linux /proc stats profiler (default: on)
Definition: context.hpp:82

thrill::api::HostContext::dispatcher_
std::unique_ptr< net::DispatcherThread > dispatcher_
main host network dispatcher thread backend
Definition: context.hpp:176

thrill::api::Context::base_logger_
common::JsonLogger base_logger_
base logger exclusive for this worker
Definition: context.hpp:457

thrill::api::HostContext::host_rank
size_t host_rank() const
Definition: context.hpp:133

thrill::common::SetCpuAffinity
void SetCpuAffinity(std::thread &thread, size_t cpu_id)
set cpu/core affinity of a thread
Definition: porting.cpp:111

thrill::api::HostContext::net_manager_
net::Manager net_manager_
net manager constructs communication groups to other hosts.
Definition: context.hpp:179

tlx::format_iec_units
std::string format_iec_units(uint64_t number, int precision=3)
Format number as something like 1 TiB.
Definition: format_si_iec_units.cpp:38

thrill::api::HostContext::local_host_id_
size_t local_host_id_
id among all local hosts (in test program runs)
Definition: context.hpp:167

thrill::api::HostContext::workers_per_host_
size_t workers_per_host_
number of workers per host (all have the same).
Definition: context.hpp:170

thrill::api::DetectNetBackend
static const char * DetectNetBackend()
Definition: context.cpp:822

thrill::api::MemoryConfig::verbose_
bool verbose_
StageBuilder verbosity flag.
Definition: context.hpp:79

thrill::api::Context::block_pool
data::BlockPool & block_pool()
the block manager keeps all data blocks moving through the system.
Definition: context.hpp:324

foxxll::stats_data
Definition: iostats.hpp:486

thrill::net::mpi::Construct
bool Construct(size_t group_size, DispatcherThread &dispatcher, std::unique_ptr< Group > *groups, size_t group_count)
Construct Group which connects to peers using MPI.
Definition: group.cpp:675

thrill::net::Traffic::tx
size_t tx
transmitted bytes
Definition: manager.hpp:35