Improve cpu sets and documentation

parttimenerd · Aug 2, 2019 · 9216300 · 9216300
1 parent 6ba38f7
commit 9216300
Show file tree

Hide file tree

Showing 4 changed files with 59 additions and 31 deletions.
diff --git a/doc/temci_exec.rst b/doc/temci_exec.rst
@@ -365,7 +365,7 @@ flags are of the schema ``--SETTING/--no-SETTING``):
         active:         Bool()
 
         # Number of cpu cores for the base (remaining part of the) system
-        base_core_number:         Int(range=range(0, 8))
+        base_core_number:         Int(range=range(0, NUMBER OF CPUS))
                     default: 1
 
         #   0: benchmark sequential
@@ -374,9 +374,13 @@ flags are of the schema ``--SETTING/--no-SETTING``):
         parallel:         Int()
 
         # Number of cpu cores per parallel running program.
-        sub_core_number:         Int(range=range(0, 8))
+        sub_core_number:         Int(range=range(0, NUMBER OF CPUS))
                     default: 1
 
+        # Place temci in the same cpu set as the rest of the system?
+        temci_in_base_set:  Bool()
+                    default: True
+
      # Maximum runs per tag (block attribute 'tag'), min('max_runs', 'per_tag') is used
     max_runs_per_tag:         Dict(, keys=Str(), values=Int(), default = {})
 
@@ -706,6 +710,8 @@ plugins already available:
     Disables the turbo mode on Intel CPUs
 :ref:`disable_swap`
     Disables swapping data from the RAM into a backing hard drive
+:ref:`discarded_runs`
+    Discard the first runs (sets the ``run/discarded_runs`` setting)
 :ref:`drop_fs_caches`
     Drops file system caches
 :ref:`env_randomize`
@@ -789,6 +795,11 @@ variance as accessing data on a hard drive is significantly slower than accessin
 
 Requires root privileges.
 
+discarded_runs
+~~~~~~~~~~~~~~
+Discard the first runs (sets the ``run/discarded_runs`` setting).
+As a result, the benchmark files should already be in the file system caches.
+
 drop_fs_caches
 ~~~~~~~~~~~~~~
 Drops the page cache, directory entries and inodes before every benchmarking run. This might improve the usability
@@ -887,6 +898,10 @@ Preheats the system with a CPU bound task (calculating the inverse of a big rand
 The length of the preheating can be configured by either using the ``--preheat_time SECONDS`` option or by
 setting ``run/exec_plugins/preheat_misc/time``.
 
+When the preheating takes place (before each run or at the beginning of the benchmarking) can
+be configured via ``--preheat_when [before_each_run|at_setup]`` or by setting
+``run/exec_plugins/preheat_misc/when`` (accepts a list).
+
 sleep
 ~~~~~
 Keep the system idle for some time before the actual benchmarking.
@@ -983,4 +998,9 @@ can also be set using the options with the same names prefixed with ``--cpuset_`
     sub_core_number:         Int(range=range(0, 8))
                 default: 1
 
+    # Place temci in the same cpu set as the rest of the system?
+    temci_in_base_set:  Bool()
+                default: True
+
+
 This functionality can also be enabled by using the ``--cpuset`` flag or by enabling the :ref:`cpuset` plugin.
diff --git a/temci/run/cpuset.py b/temci/run/cpuset.py
@@ -28,18 +28,20 @@ class CPUSet:
     """
 
     def __init__(self, active: bool = True, base_core_number: int = None,
-                 parallel: int = None, sub_core_number: int = None):
+                 parallel: int = None, sub_core_number: int = None,
+                 temci_in_base_set: bool = True):
         """
         Initializes the cpu sets an determines the number of parallel programs (parallel_number variable).
 
         :param active: are cpu sets actually used?
         :param base_core_number: number of cpu cores for the base (remaining part of the) system
         :param parallel: 0: benchmark sequential, > 0: benchmark parallel with n instances, -1: determine n automatically
         :param sub_core_number: number of cpu cores per parallel running program
+        :param temci_in_base_set: place temci in the same cpu set as the rest of the system?
         :raises ValueError: if the passed parameters don't work together on the current platform
         :raises EnvironmentError: if the environment can't be setup properly (e.g. no root privileges)
         """
-        #self.bench_set = "bench.set"
+        # self.bench_set = "bench.set"
         self.active = active and has_root_privileges()  # type: bool
         """ Are cpu sets actually used? """
         self.base_core_number = Settings().default(base_core_number, "run/cpuset/base_core_number")  # type: int
@@ -48,21 +50,23 @@ def __init__(self, active: bool = True, base_core_number: int = None,
         """ 0: benchmark sequential, > 0: benchmark parallel with n instances, -1: determine n automatically """
         self.sub_core_number = Settings().default(sub_core_number, "run/cpuset/sub_core_number")  # type: int
         """ Number of cpu cores per parallel running program """
-        self.av_cores = len(self._cpus_of_set("")) if active else multiprocessing.cpu_count()  # zype: int
+        self.av_cores = len(self._cpus_of_set("")) if active else multiprocessing.cpu_count()  # type: int
         """ Number of available cpu cores """
         self.parallel_number = 0  # type: int
         """ Number of used parallel instances, zero if the benchmarking is done sequentially """
+        self.temci_in_base_set = Settings().default(temci_in_base_set, "run/cpuset/temci_in_base_set")
+        """ Place temci in the same cpu set as the rest of the system? """
         if self.parallel != 0:
             if self.parallel == -1:
                 self.parallel_number = self._number_of_parallel_sets(self.base_core_number,
                                                                      True, self.sub_core_number)
             else:
                 self.parallel_number = self.parallel
-                if self.parallel > self._number_of_parallel_sets(self.base_core_number, True, self.sub_core_number)\
+                if self.parallel > self._number_of_parallel_sets(self.base_core_number, True, self.sub_core_number) \
                         and self.active:
                     raise ValueError("Invalid values for base_core_number and sub_core_number "
-                             "on system with just {} cores. Note: The benchmark controller "
-                             "needs a cpuset too.".format(self.av_cores))
+                                     "on system with just {} cores. Note: The benchmark controller "
+                                     "needs a cpuset too.".format(self.av_cores))
             self.base_core_number = self.av_cores - self.sub_core_number * self.parallel_number - 1
         if not self.active:
             if active and not has_root_privileges():
@@ -72,7 +76,7 @@ def __init__(self, active: bool = True, base_core_number: int = None,
         typecheck(self.base_core_number, PositiveInt())
         typecheck(self.parallel_number, NaturalNumber())
         self.own_sets = [SUB_BENCH_SET.format(i) for i in range(0, self.parallel_number)] \
-                   + [CONTROLLER_SUB_BENCH_SET, NEW_ROOT_SET, BENCH_SET]
+                        + [CONTROLLER_SUB_BENCH_SET, NEW_ROOT_SET, BENCH_SET]
         try:
             self._init_cpuset()
         except BaseException:
@@ -116,7 +120,7 @@ def teardown(self):
                 self._delete_set(set)
             except EnvironmentError as ex:
                 pass
-                #logging.error(str(ex))
+                # logging.error(str(ex))
             except BaseException:
                 raise
 
@@ -125,11 +129,13 @@ def _number_of_parallel_sets(self, base_core_number: int, parallel: bool, sub_co
         Calculates the number of possible parallel sets.
         """
         typecheck([base_core_number, parallel, sub_core_number], List(Int()))
-        if base_core_number + 1 + sub_core_number > self.av_cores and self.active:
+        if base_core_number + (0 if self.temci_in_base_set else 1) + sub_core_number > self.av_cores and self.active:
             raise ValueError("Invalid values for base_core_number and sub_core_number "
-                             "on system with just {} cores. Note: The benchmark controller"
-                             "needs a cpuset too.".format(self.av_cores))
-        av_cores_for_par = self.av_cores - base_core_number - 1
+                             "on system with just {} cores.{}".format(self.av_cores,
+                                                                      ""
+                                                                      if self.temci_in_base_set
+                                                                      else "Note: temci needs a cpuset too."))
+        av_cores_for_par = self.av_cores - base_core_number - (0 if self.temci_in_base_set else 1)
         if parallel:
             return av_cores_for_par // sub_core_number
         return 1
@@ -142,9 +148,9 @@ def _init_cpuset(self):
             if not os.path.exists(CPUSET_DIR):
                 os.mkdir(CPUSET_DIR)
             proc = subprocess.Popen(["bash", "-c", "mount -t cpuset none /cpuset/"],
-                                stdout=subprocess.DEVNULL,
-                                stderr=subprocess.PIPE,
-                                universal_newlines=True)
+                                    stdout=subprocess.DEVNULL,
+                                    stderr=subprocess.PIPE,
+                                    universal_newlines=True)
             out, err = proc.communicate()
             if proc.poll() > 0:
                 raise EnvironmentError(
@@ -153,13 +159,13 @@ def _init_cpuset(self):
         self._create_cpuset(NEW_ROOT_SET, self._get_av_cpus()[0: self.base_core_number])
         logging.info("Move all processes to new root cpuset")
         self._move_all_to_new_root()
-        if self.parallel == 0: # just use all available cores, as the benchmarked program also runs in it
+        if self.parallel == 0:  # just use all available cores, as the benchmarked program also runs in it
             self._create_cpuset(CONTROLLER_SUB_BENCH_SET, self._get_av_cpus()[self.base_core_number:self.av_cores])
         else:
             self._create_cpuset(CONTROLLER_SUB_BENCH_SET, self._get_av_cpus()[self.base_core_number:1])
-        self._move_process_to_set(CONTROLLER_SUB_BENCH_SET)
+        self._move_process_to_set(NEW_ROOT_SET if self.temci_in_base_set else CONTROLLER_SUB_BENCH_SET)
         for i in range(0, self.parallel_number):
-            start = self.base_core_number + 1 + (i * self.sub_core_number)
+            start = self.base_core_number + (0 if self.temci_in_base_set else 1) + (i * self.sub_core_number)
             self._create_cpuset(SUB_BENCH_SET.format(i), self._get_av_cpus()[start:start + self.sub_core_number])
 
     def _cpus_of_set(self, name: str) -> t.Optional[t.List[int]]:
@@ -202,19 +208,19 @@ def _move_all_to_new_root(self, name: str = 'root', _count: int = 100):
         :param name: name of the root cpu set
         :param _count: maximum cpu set tree depth
         """
-        cpus =  self._get_av_cpus()[0:self.base_core_number]
+        cpus = self._get_av_cpus()[0:self.base_core_number]
         self._set_cpu_affinity_of_set(name, cpus)
         if _count > 0:
             for child in self._child_sets(name):
                 if len(child) > 1:
-                    #print("moved from {child} to {root}".format(child=child, root=NEW_ROOT_SET))
+                    # print("moved from {child} to {root}".format(child=child, root=NEW_ROOT_SET))
                     try:
                         self._move_all_to_new_root(child, _count - 1)
                     except EnvironmentError as err:
                         pass
-                        #logging.warning(str(err))
+                        # logging.warning(str(err))
         self._move_processes(name, NEW_ROOT_SET)
-        #if _count == 100:
+        # if _count == 100:
         #    self._cset("proc --move -k --force --threads --pid=0-100000 --toset={}".format(NEW_ROOT_SET))
 
     def _move_processes(self, from_set: str, to_set: str):
@@ -275,15 +281,15 @@ def _set_cpu_affinity_of_set(self, set: str, cpus: t.List[int]):
         """ Set the cpu affinity for all processes that belong to the given set """
         if set == "root":
             set = ""
-        app = "cgroup.procs"  if set == "" else set + "/cgroup.procs"
+        app = "cgroup.procs" if set == "" else set + "/cgroup.procs"
         with open(os.path.join(CPUSET_DIR + "/" + app), "r") as f:
             for line in f.readlines():
                 try:
                     self._set_cpu_affinity(int(line.strip()), cpus)
-                    #logging.info("success {}".format(line))
+                    # logging.info("success {}".format(line))
                 except EnvironmentError as err:
                     pass
-                    #logging.error(str(err))
+                    # logging.error(str(err))
 
     def _set_cpu_affinity(self, pid: int, cpus: t.List[int]):
         """ Set the cpu affinity for the given process to the given cpu cores """
@@ -294,7 +300,7 @@ def _set_cpu_affinity(self, pid: int, cpus: t.List[int]):
                                 universal_newlines=True)
         out, err = proc.communicate()
         if proc.poll() > 0:
-            raise EnvironmentError (
+            raise EnvironmentError(
                 "taskset error (cmd = '{}'): ".format(cmd) + str(err) + str(out)
             )
         return str(out)
@@ -307,7 +313,7 @@ def _cset(self, argument: str):
         :return: output of executing the combined command
         :raises EnvironmentError: if something goes wrong
         """
-        #cmd = ["/bin/sh", "-c", "sudo cset {}".format(argument)]
+        # cmd = ["/bin/sh", "-c", "sudo cset {}".format(argument)]
         cmd = ["/bin/sh", "-c", "python3 -c 'import cpuset.main; print(cpuset.main.main())' " + argument]
         proc = subprocess.Popen(cmd,
                                 stdout=subprocess.PIPE,

diff --git a/temci/run/run_driver_plugin.py b/temci/run/run_driver_plugin.py
@@ -12,6 +12,7 @@
 import subprocess, logging, os, signal, random, multiprocessing, time
 import typing as t
 
+
 class AbstractRunDriverPlugin:
     """
     A plugin for a run driver. It allows additional modifications.
@@ -161,7 +162,6 @@ def setup(self):
     def setup_block(self, block: RunProgramBlock, runs: int = 1):
         if "before_each_run" in self.misc_settings["when"]:
             block["cmd_prefix"].append(self._command())
-            print(block["cmd_prefix"])
 
     def _command(self) -> str:
         heat_time = self.misc_settings["time"]

diff --git a/temci/utils/settings.py b/temci/utils/settings.py
@@ -121,7 +121,9 @@ class Settings(metaclass=Singleton):
                                                       "> 0: benchmark parallel with n instances, "
                                                       "-1: determine n automatically") // Default(0),
                 "sub_core_number": ValidCPUCoreNumber() // Description("Number of cpu cores per parallel running program.")
-                                   // Default(1)
+                                   // Default(1),
+                "temci_in_base_set": Bool() // Default(True)
+                                     // Description("place temci in the same cpu set as the rest of the system?")
             }),
             "disable_hyper_threading": Bool() // Default(False)
                                        // Description("Disable the hyper threaded cores. Good for cpu bound programs."),