Skip to content

Commit

Permalink
added logic to find num_workers for autoscaling clusters (#647)
Browse files Browse the repository at this point in the history
Signed-off-by: cindyyuanjiang <[email protected]>
  • Loading branch information
cindyyuanjiang authored Nov 3, 2023
1 parent ebca530 commit 2f1a9fb
Show file tree
Hide file tree
Showing 2 changed files with 26 additions and 0 deletions.
13 changes: 13 additions & 0 deletions user_tools/src/spark_rapids_pytools/cloud_api/databricks_aws.py
Original file line number Diff line number Diff line change
Expand Up @@ -205,7 +205,20 @@ def _init_nodes(self):
master_nodes_from_conf = self.props.get_value_silent('driver')
worker_nodes_from_conf = self.props.get_value_silent('executors')
num_workers = self.props.get_value_silent('num_workers')
if num_workers is None and self.props.get_value_silent('autoscale') is not None:
target_workers = self.props.get_value_silent('autoscale', 'target_workers')
# fall back to min_workers when target_workers is missing, since the two are usually the same
min_workers = self.props.get_value_silent('autoscale', 'min_workers')
if target_workers is not None:
num_workers = target_workers
self.logger.info('Autoscaling cluster, will set number of workers to target_workers = %s',
num_workers)
elif min_workers is not None:
num_workers = min_workers
self.logger.info('Autoscaling cluster, will set number of workers to min_workers = %s',
num_workers)
if num_workers is None:
self.logger.info('Unable to find number of workers for cluster, will default to 0')
num_workers = 0
# construct master node info when cluster is inactive
if master_nodes_from_conf is None:
Expand Down
13 changes: 13 additions & 0 deletions user_tools/src/spark_rapids_pytools/cloud_api/databricks_azure.py
Original file line number Diff line number Diff line change
Expand Up @@ -289,7 +289,20 @@ def _init_nodes(self):
driver_nodes_from_conf = self.props.get_value_silent('driver')
worker_nodes_from_conf = self.props.get_value_silent('executors')
num_workers = self.props.get_value_silent('num_workers')
if num_workers is None and self.props.get_value_silent('autoscale') is not None:
target_workers = self.props.get_value_silent('autoscale', 'target_workers')
# fall back to min_workers when target_workers is missing, since the two are usually the same
min_workers = self.props.get_value_silent('autoscale', 'min_workers')
if target_workers is not None:
num_workers = target_workers
self.logger.info('Autoscaling cluster, will set number of workers to target_workers = %s',
num_workers)
elif min_workers is not None:
num_workers = min_workers
self.logger.info('Autoscaling cluster, will set number of workers to min_workers = %s',
num_workers)
if num_workers is None:
self.logger.info('Unable to find number of workers for cluster, will default to 0')
num_workers = 0
# construct driver node info when cluster is inactive
if driver_nodes_from_conf is None:
Expand Down

0 comments on commit 2f1a9fb

Please sign in to comment.