Skip to content

Commit

Permalink
Remove default mkl settings when start ray (intel-analytics#1837)
Browse files Browse the repository at this point in the history
  • Loading branch information
hkvision committed Dec 12, 2019
1 parent 566f754 commit f9e9740
Showing 1 changed file with 7 additions and 27 deletions.
34 changes: 7 additions & 27 deletions python/orca/src/bigdl/orca/ray/util/raycontext.py
Original file line number Diff line number Diff line change
Expand Up @@ -55,43 +55,31 @@ class RayServiceFuncGenerator(object):
"""
This should be a pickable class.
"""

def _get_MKL_config(self, cores):
return {"intra_op_parallelism_threads": str(cores),
"inter_op_parallelism_threads": str(cores),
"OMP_NUM_THREADS": str(cores),
"KMP_BLOCKTIME": "0",
"KMP_AFFINITY": "granularity = fine, verbose, compact, 1, 0",
"KMP_SETTINGS": "0"}

def _prepare_env(self, cores=None):
def _prepare_env(self):
modified_env = os.environ.copy()
if self.env:
modified_env.update(self.env)
cwd = os.getcwd()
modified_env["PATH"] = "{}/{}:{}".format(cwd, "/".join(self.python_loc.split("/")[:-1]),
os.environ["PATH"])
modified_env.pop("MALLOC_ARENA_MAX", None)
modified_env.pop("RAY_BACKEND_LOG_LEVEL", None)
# unset all MKL setting
# Unset all MKL setting as Analytics Zoo would give default values when init env.
# Running different programs may need different configurations.
modified_env.pop("intra_op_parallelism_threads", None)
modified_env.pop("inter_op_parallelism_threads", None)
modified_env.pop("OMP_NUM_THREADS", None)
modified_env.pop("KMP_BLOCKTIME", None)
modified_env.pop("KMP_AFFINITY", None)
modified_env.pop("KMP_SETTINGS", None)
if cores:
cores = int(cores)
print("MKL cores is {}".format(cores))
modified_env.update(self._get_MKL_config(cores))
if self.env: # Add in env argument if any MKL setting is needed.
modified_env.update(self.env)
if self.verbose:
print("Executing with these environment setting:")
for pair in modified_env.items():
print(pair)
print("The $PATH is: {}".format(modified_env["PATH"]))
return modified_env

def __init__(self, python_loc, redis_port, ray_node_cpu_cores, mkl_cores,
def __init__(self, python_loc, redis_port, ray_node_cpu_cores,
password, object_store_memory, waitting_time_sec=6, verbose=False, env=None,
extra_params=None):
"""object_store_memory: integer in bytes"""
Expand All @@ -100,7 +88,6 @@ def __init__(self, python_loc, redis_port, ray_node_cpu_cores, mkl_cores,
self.redis_port = redis_port
self.password = password
self.ray_node_cpu_cores = ray_node_cpu_cores
self.mkl_cores = mkl_cores
self.ray_exec = self._get_ray_exec()
self.object_store_memory = object_store_memory
self.waiting_time_sec = waitting_time_sec
Expand Down Expand Up @@ -150,7 +137,7 @@ def _get_raylet_command(redis_address,
extra_params=extra_params)

def _start_ray_node(self, command, tag, wait_before=5, wait_after=5):
modified_env = self._prepare_env(self.mkl_cores)
modified_env = self._prepare_env()
print("Starting {} by running: {}".format(tag, command))
print("Wait for {} sec before launching {}".format(wait_before, tag))
time.sleep(wait_before)
Expand Down Expand Up @@ -239,7 +226,6 @@ def __init__(self, sc, redis_port=None, password="123456", object_store_memory=N
python_loc=self.python_loc,
redis_port=self.redis_port,
ray_node_cpu_cores=self.ray_node_cpu_cores,
mkl_cores=self._get_mkl_cores(),
password=password,
object_store_memory=self._enrich_object_sotre_memory(sc, object_store_memory),
verbose=verbose,
Expand Down Expand Up @@ -302,12 +288,6 @@ def purge(self):
self.ray_service.gen_stop()).collect()
self.stopped = True

def _get_mkl_cores(self):
if self.is_local:
return 1
else:
return int(self.sc._conf.get("spark.executor.cores"))

def _get_ray_node_cpu_cores(self):
if self.is_local:

Expand Down

0 comments on commit f9e9740

Please sign in to comment.