From f8521eff04b808a1ff2cbe7c18e8d3d2d5dc59a3 Mon Sep 17 00:00:00 2001
From: cindyyuanjiang
Date: Thu, 21 Sep 2023 13:43:24 -0700
Subject: [PATCH 1/4] initial implementation for adding discount options for
 both ascli and spark_rapids_user_tools

Signed-off-by: cindyyuanjiang
---
 .../rapids/qualification.py                   | 43 +++++++++++++++++++
 .../wrappers/databricks_aws_wrapper.py        | 18 ++++++--
 .../wrappers/databricks_azure_wrapper.py      | 18 ++++++--
 .../wrappers/dataproc_wrapper.py              | 14 +++++-
 .../wrappers/emr_wrapper.py                   | 14 +++++-
 .../wrappers/onprem_wrapper.py                | 14 +++++-
 .../spark_rapids_tools/cmdli/argprocessor.py  | 11 ++++-
 .../src/spark_rapids_tools/cmdli/tools_cli.py | 12 ++++++
 8 files changed, 134 insertions(+), 10 deletions(-)

diff --git a/user_tools/src/spark_rapids_pytools/rapids/qualification.py b/user_tools/src/spark_rapids_pytools/rapids/qualification.py
index a8861c6a1..b5ba44d4a 100644
--- a/user_tools/src/spark_rapids_pytools/rapids/qualification.py
+++ b/user_tools/src/spark_rapids_pytools/rapids/qualification.py
@@ -291,6 +291,46 @@ def __process_filter_args(self, arg_val: str):
         selected_filter = QualFilterApp.fromstring(default_filter_txt)
         self.ctxt.set_ctxt('filterApps', selected_filter)
 
+    def _process_price_discount_args(self):
+        raw_cpu_discount = self.wrapper_options.get('cpuDiscount')
+        raw_gpu_discount = self.wrapper_options.get('gpuDiscount')
+        raw_global_discount = self.wrapper_options.get('globalDiscount')
+        if raw_global_discount != None and (raw_cpu_discount != None or raw_gpu_discount != None):
+            self.logger.error('Setting both global_discount and either cpu_discount or '
+                              'gpu_discount is inconsistent.')
+            raise RuntimeError('Invalid arguments. If global_discount is specified, no additional '
+                               'discount arguments (cpu_discount or gpu_discount) should be set.')
+        try:
+            cpu_discount = int(raw_cpu_discount) if raw_cpu_discount != None else 0
+            gpu_discount = int(raw_gpu_discount) if raw_gpu_discount != None else 0
+            global_discount = int(raw_global_discount) if raw_global_discount != None else 0
+        except Exception as ex:
+            self.logger.error('Invalid arguments. Failed to process discount arguments: %s', ex)
+            raise ex
+
+        if cpu_discount < 0 or cpu_discount > 100:
+            self.logger.error('cpu_discount is out of range [0, 100]')
+            raise RuntimeError(f'Invalid arguments. cpu_discount = {cpu_discount} is an invalid '
+                               'percentage.')
+        if gpu_discount < 0 or gpu_discount > 100:
+            self.logger.error('gpu_discount is out of range [0, 100]')
+            raise RuntimeError(f'Invalid arguments. gpu_discount = {gpu_discount} is an invalid '
+                               'percentage.')
+        if global_discount < 0 or global_discount > 100:
+            self.logger.error('global_discount is out of range [0, 100]')
+            raise RuntimeError(f'Invalid arguments. global_discount = {global_discount} is an invalid '
+                               'percentage.')
+
+        if global_discount != 0:
+            self.ctxt.set_ctxt('cpu_discount', global_discount)
+            self.ctxt.set_ctxt('gpu_discount', global_discount)
+        else:
+            self.ctxt.set_ctxt('cpu_discount', cpu_discount)
+            self.ctxt.set_ctxt('gpu_discount', gpu_discount)
+
+        self.logger.info("cpu_discount = %s", cpu_discount)
+        self.logger.info("gpu_discount = %s", gpu_discount)
+
     def _process_custom_args(self):
         """
         Qualification tool processes extra arguments:
@@ -322,6 +362,7 @@ def _process_custom_args(self):
 
         self._process_offline_cluster_args()
         self._process_eventlogs_args()
+        self._process_price_discount_args()
         # This is noise to dump everything
         # self.logger.debug('%s custom arguments = %s', self.pretty_name(), self.ctxt.props['wrapperCtx'])
@@ -530,6 +571,8 @@ def __calc_apps_cost(self,
         def get_costs_for_single_app(df_row, estimator: SavingsEstimator) -> pd.Series:
             cpu_cost, gpu_cost, est_savings = estimator.get_costs_and_savings(df_row['App Duration'],
                                                                               df_row['Estimated GPU Duration'])
+            cpu_cost = (100 - self.ctxt.get_ctxt('cpu_discount')) / 100 * cpu_cost
+            gpu_cost = (100 - self.ctxt.get_ctxt('gpu_discount')) / 100 * gpu_cost
             # We do not want to mistakenly mark a Not-applicable app as Recommended in the savings column
             if df_row[speedup_rec_col] == 'Not Applicable':
                 savings_recommendations = 'Not Applicable'
diff --git a/user_tools/src/spark_rapids_pytools/wrappers/databricks_aws_wrapper.py b/user_tools/src/spark_rapids_pytools/wrappers/databricks_aws_wrapper.py
index 083d5d56f..795d5763b 100644
--- a/user_tools/src/spark_rapids_pytools/wrappers/databricks_aws_wrapper.py
+++ b/user_tools/src/spark_rapids_pytools/wrappers/databricks_aws_wrapper.py
@@ -41,6 +41,9 @@ def qualification(cpu_cluster: str = None,
                          QualGpuClusterReshapeType.get_default()),
                      jvm_heap_size: int = 24,
                      verbose: bool = False,
+                     cpu_discount: int = None,
+                     gpu_discount: int = None,
+                     global_discount: int = None,
                      **rapids_options) -> None:
        """
        The Qualification tool analyzes Spark events generated from CPU based Spark applications to
@@ -86,9 +89,15 @@ def qualification(cpu_cluster: str = None,
               It accepts one of the following ("CLUSTER", "JOB" and the default value "MATCH").
               "MATCH": keep GPU cluster same number of nodes as CPU cluster;
               "CLUSTER": recommend optimal GPU cluster by cost for entire cluster;
-              "JOB": recommend optimal GPU cluster by cost per job
-       :param verbose: True or False to enable verbosity to the wrapper script.
+              "JOB": recommend optimal GPU cluster by cost per job.
        :param jvm_heap_size: The maximum heap size of the JVM in gigabytes.
+       :param verbose: True or False to enable verbosity to the wrapper script.
+       :param cpu_discount: A percent discount for the cpu cluster cost in the form of an integer value
+              (e.g. 30 for 30% discount).
+       :param gpu_discount: A percent discount for the gpu cluster cost in the form of an integer value
+              (e.g. 30 for 30% discount).
+       :param global_discount: A percent discount for both the cpu and gpu cluster costs in the form of an
+              integer value (e.g. 30 for 30% discount).
        :param rapids_options: A list of valid Qualification tool options.
               Note that the wrapper ignores ["output-directory", "platform"] flags, and it does not support
               multiple "spark-property" arguments.
@@ -119,7 +128,10 @@ def qualification(cpu_cluster: str = None,
            'eventlogs': eventlogs,
            'filterApps': filter_apps,
            'toolsJar': tools_jar,
-           'gpuClusterRecommendation': gpu_cluster_recommendation
+           'gpuClusterRecommendation': gpu_cluster_recommendation,
+           'cpuDiscount': cpu_discount,
+           'gpuDiscount': gpu_discount,
+           'globalDiscount': global_discount
        }
        QualificationAsLocal(platform_type=CspEnv.DATABRICKS_AWS,
                             cluster=None,
diff --git a/user_tools/src/spark_rapids_pytools/wrappers/databricks_azure_wrapper.py b/user_tools/src/spark_rapids_pytools/wrappers/databricks_azure_wrapper.py
index 87a9b2891..a0427989f 100644
--- a/user_tools/src/spark_rapids_pytools/wrappers/databricks_azure_wrapper.py
+++ b/user_tools/src/spark_rapids_pytools/wrappers/databricks_azure_wrapper.py
@@ -40,6 +40,9 @@ def qualification(cpu_cluster: str = None,
                          QualGpuClusterReshapeType.get_default()),
                      jvm_heap_size: int = 24,
                      verbose: bool = False,
+                     cpu_discount: int = None,
+                     gpu_discount: int = None,
+                     global_discount: int = None,
                      **rapids_options) -> None:
        """
        The Qualification tool analyzes Spark events generated from CPU based Spark applications to
@@ -84,9 +87,15 @@ def qualification(cpu_cluster: str = None,
               It accepts one of the following ("CLUSTER", "JOB" and the default value "MATCH").
               "MATCH": keep GPU cluster same number of nodes as CPU cluster;
               "CLUSTER": recommend optimal GPU cluster by cost for entire cluster;
-              "JOB": recommend optimal GPU cluster by cost per job
-       :param verbose: True or False to enable verbosity to the wrapper script.
+              "JOB": recommend optimal GPU cluster by cost per job.
        :param jvm_heap_size: The maximum heap size of the JVM in gigabytes.
+       :param verbose: True or False to enable verbosity to the wrapper script.
+       :param cpu_discount: A percent discount for the cpu cluster cost in the form of an integer value
+              (e.g. 30 for 30% discount).
+       :param gpu_discount: A percent discount for the gpu cluster cost in the form of an integer value
+              (e.g. 30 for 30% discount).
+       :param global_discount: A percent discount for both the cpu and gpu cluster costs in the form of an
+              integer value (e.g. 30 for 30% discount).
        :param rapids_options: A list of valid Qualification tool options.
               Note that the wrapper ignores ["output-directory", "platform"] flags, and it does not support
               multiple "spark-property" arguments.
@@ -116,7 +125,10 @@ def qualification(cpu_cluster: str = None,
            'eventlogs': eventlogs,
            'filterApps': filter_apps,
            'toolsJar': tools_jar,
-           'gpuClusterRecommendation': gpu_cluster_recommendation
+           'gpuClusterRecommendation': gpu_cluster_recommendation,
+           'cpuDiscount': cpu_discount,
+           'gpuDiscount': gpu_discount,
+           'globalDiscount': global_discount
        }
        QualificationAsLocal(platform_type=CspEnv.DATABRICKS_AZURE,
                             cluster=None,
diff --git a/user_tools/src/spark_rapids_pytools/wrappers/dataproc_wrapper.py b/user_tools/src/spark_rapids_pytools/wrappers/dataproc_wrapper.py
index 05ae9eb60..65b03e0b4 100644
--- a/user_tools/src/spark_rapids_pytools/wrappers/dataproc_wrapper.py
+++ b/user_tools/src/spark_rapids_pytools/wrappers/dataproc_wrapper.py
@@ -41,6 +41,9 @@ def qualification(cpu_cluster: str = None,
                          QualGpuClusterReshapeType.get_default()),
                      jvm_heap_size: int = 24,
                      verbose: bool = False,
+                     cpu_discount: int = None,
+                     gpu_discount: int = None,
+                     global_discount: int = None,
                      **rapids_options) -> None:
        """
        The Qualification tool analyzes Spark events generated from CPU based Spark applications to
@@ -87,6 +90,12 @@ def qualification(cpu_cluster: str = None,
               "JOB": recommend optimal GPU cluster by cost per job
        :param jvm_heap_size: The maximum heap size of the JVM in gigabytes
        :param verbose: True or False to enable verbosity to the wrapper script
+       :param cpu_discount: A percent discount for the cpu cluster cost in the form of an integer value
+              (e.g. 30 for 30% discount).
+       :param gpu_discount: A percent discount for the gpu cluster cost in the form of an integer value
+              (e.g. 30 for 30% discount).
+       :param global_discount: A percent discount for both the cpu and gpu cluster costs in the form of an
+              integer value (e.g. 30 for 30% discount).
        :param rapids_options: A list of valid Qualification tool options.
               Note that the wrapper ignores ["output-directory", "platform"] flags, and it does not support
               multiple "spark-property" arguments.
@@ -114,7 +123,10 @@ def qualification(cpu_cluster: str = None,
            'eventlogs': eventlogs,
            'filterApps': filter_apps,
            'toolsJar': tools_jar,
-           'gpuClusterRecommendation': gpu_cluster_recommendation
+           'gpuClusterRecommendation': gpu_cluster_recommendation,
+           'cpuDiscount': cpu_discount,
+           'gpuDiscount': gpu_discount,
+           'globalDiscount': global_discount
        }
        tool_obj = QualificationAsLocal(platform_type=CspEnv.DATAPROC,
diff --git a/user_tools/src/spark_rapids_pytools/wrappers/emr_wrapper.py b/user_tools/src/spark_rapids_pytools/wrappers/emr_wrapper.py
index 65de11341..225075236 100644
--- a/user_tools/src/spark_rapids_pytools/wrappers/emr_wrapper.py
+++ b/user_tools/src/spark_rapids_pytools/wrappers/emr_wrapper.py
@@ -42,6 +42,9 @@ def qualification(cpu_cluster: str = None,
                          QualGpuClusterReshapeType.get_default()),
                      jvm_heap_size: int = 24,
                      verbose: bool = False,
+                     cpu_discount: int = None,
+                     gpu_discount: int = None,
+                     global_discount: int = None,
                      **rapids_options) -> None:
        """
        The Qualification tool analyzes Spark events generated from CPU based Spark applications to
@@ -85,6 +88,12 @@ def qualification(cpu_cluster: str = None,
               "JOB": recommend optimal GPU cluster by cost per job
        :param jvm_heap_size: The maximum heap size of the JVM in gigabytes
        :param verbose: True or False to enable verbosity to the wrapper script
+       :param cpu_discount: A percent discount for the cpu cluster cost in the form of an integer value
+              (e.g. 30 for 30% discount).
+       :param gpu_discount: A percent discount for the gpu cluster cost in the form of an integer value
+              (e.g. 30 for 30% discount).
+       :param global_discount: A percent discount for both the cpu and gpu cluster costs in the form of an
+              integer value (e.g. 30 for 30% discount).
        :param rapids_options: A list of valid Qualification tool options.
               Note that the wrapper ignores ["output-directory", "platform"] flags, and it does not support
               multiple "spark-property" arguments.
@@ -112,7 +121,10 @@ def qualification(cpu_cluster: str = None,
            'eventlogs': eventlogs,
            'filterApps': filter_apps,
            'toolsJar': tools_jar,
-           'gpuClusterRecommendation': gpu_cluster_recommendation
+           'gpuClusterRecommendation': gpu_cluster_recommendation,
+           'cpuDiscount': cpu_discount,
+           'gpuDiscount': gpu_discount,
+           'globalDiscount': global_discount
        }
        QualificationAsLocal(platform_type=CspEnv.EMR,
                             cluster=None,
diff --git a/user_tools/src/spark_rapids_pytools/wrappers/onprem_wrapper.py b/user_tools/src/spark_rapids_pytools/wrappers/onprem_wrapper.py
index 1e4ea0c56..ac8bf8454 100644
--- a/user_tools/src/spark_rapids_pytools/wrappers/onprem_wrapper.py
+++ b/user_tools/src/spark_rapids_pytools/wrappers/onprem_wrapper.py
@@ -38,6 +38,9 @@ def qualification(cpu_cluster: str = None,
                          QualGpuClusterReshapeType.get_default()),
                      jvm_heap_size: int = 24,
                      verbose: bool = False,
+                     cpu_discount: int = None,
+                     gpu_discount: int = None,
+                     global_discount: int = None,
                      **rapids_options) -> None:
        """
        The Qualification tool analyzes Spark events generated from CPU based Spark applications to
@@ -65,6 +68,12 @@ def qualification(cpu_cluster: str = None,
               "JOB": recommend optimal GPU cluster by cost per job
        :param jvm_heap_size: The maximum heap size of the JVM in gigabytes
        :param verbose: True or False to enable verbosity to the wrapper script
+       :param cpu_discount: A percent discount for the cpu cluster cost in the form of an integer value
+              (e.g. 30 for 30% discount).
+       :param gpu_discount: A percent discount for the gpu cluster cost in the form of an integer value
+              (e.g. 30 for 30% discount).
+       :param global_discount: A percent discount for both the cpu and gpu cluster costs in the form of an
+              integer value (e.g. 30 for 30% discount).
        :param rapids_options: A list of valid Qualification tool options.
               Note that the wrapper ignores ["output-directory", "platform"] flags, and it does not support
               multiple "spark-property" arguments.
@@ -103,7 +112,10 @@ def qualification(cpu_cluster: str = None,
            'filterApps': filter_apps,
            'toolsJar': tools_jar,
            'gpuClusterRecommendation': gpu_cluster_recommendation,
-           'targetPlatform': target_platform
+           'targetPlatform': target_platform,
+           'cpuDiscount': cpu_discount,
+           'gpuDiscount': gpu_discount,
+           'globalDiscount': global_discount
        }
        tool_obj = QualificationAsLocal(platform_type=CspEnv.ONPREM,
                                        output_folder=local_folder,
diff --git a/user_tools/src/spark_rapids_tools/cmdli/argprocessor.py b/user_tools/src/spark_rapids_tools/cmdli/argprocessor.py
index 1803f7602..8814f13cb 100644
--- a/user_tools/src/spark_rapids_tools/cmdli/argprocessor.py
+++ b/user_tools/src/spark_rapids_tools/cmdli/argprocessor.py
@@ -303,12 +303,18 @@ class QualifyUserArgModel(ToolUserArgModel):
     target_platform: Optional[CspEnv] = None
     filter_apps: Optional[QualFilterApp] = None
     gpu_cluster_recommendation: Optional[QualGpuClusterReshapeType] = None
+    cpu_discount: Optional[int] = None
+    gpu_discount: Optional[int] = None
+    global_discount: Optional[int] = None
 
     def init_tool_args(self):
         self.p_args['toolArgs']['platform'] = self.platform
         self.p_args['toolArgs']['savingsCalculations'] = True
         self.p_args['toolArgs']['filterApps'] = self.filter_apps
         self.p_args['toolArgs']['targetPlatform'] = self.target_platform
+        self.p_args['toolArgs']['cpuDiscount'] = self.cpu_discount
+        self.p_args['toolArgs']['gpuDiscount'] = self.gpu_discount
+        self.p_args['toolArgs']['globalDiscount'] = self.global_discount
         # check the reshapeType argument
         if self.gpu_cluster_recommendation is None:
             self.p_args['toolArgs']['gpuClusterRecommendation'] = QualGpuClusterReshapeType.get_default()
@@ -401,7 +407,10 @@ def build_tools_args(self) -> dict:
             'toolsJar': None,
             'gpuClusterRecommendation': self.p_args['toolArgs']['gpuClusterRecommendation'],
             # used to initialize the pricing information
-            'targetPlatform': self.p_args['toolArgs']['targetPlatform']
+            'targetPlatform': self.p_args['toolArgs']['targetPlatform'],
+            'cpuDiscount': self.p_args['toolArgs']['cpuDiscount'],
+            'gpuDiscount': self.p_args['toolArgs']['gpuDiscount'],
+            'globalDiscount': self.p_args['toolArgs']['globalDiscount']
         }
         return wrapped_args
 
diff --git a/user_tools/src/spark_rapids_tools/cmdli/tools_cli.py b/user_tools/src/spark_rapids_tools/cmdli/tools_cli.py
index 001472e36..c6ea2bc88 100644
--- a/user_tools/src/spark_rapids_tools/cmdli/tools_cli.py
+++ b/user_tools/src/spark_rapids_tools/cmdli/tools_cli.py
@@ -40,6 +40,9 @@ def qualification(self,
                       target_platform: str = None,
                       output_folder: str = None,
                       filter_apps: str = None,
+                      cpu_discount: int = None,
+                      gpu_discount: int = None,
+                      global_discount: int = None,
                       gpu_cluster_recommendation: str = QualGpuClusterReshapeType.tostring(
                           QualGpuClusterReshapeType.get_default())):
        """The Qualification cmd provides estimated running costs and speedups by migrating Apache
@@ -75,6 +78,12 @@ def qualification(self,
               'Recommended', or 'Strongly Recommended' based on speedups.
               "SAVINGS" lists all the apps that have positive estimated GPU savings except for the apps
               that are "Not Applicable"
+       :param cpu_discount: A percent discount for the cpu cluster cost in the form of an integer value
+              (e.g. 30 for 30% discount).
+       :param gpu_discount: A percent discount for the gpu cluster cost in the form of an integer value
+              (e.g. 30 for 30% discount).
+       :param global_discount: A percent discount for both the cpu and gpu cluster costs in the form of an
+              integer value (e.g. 30 for 30% discount).
        :param gpu_cluster_recommendation: The type of GPU cluster recommendation to generate.
               Requires "Cluster".
 
@@ -91,6 +100,9 @@ def qualification(self,
            target_platform=target_platform,
            output_folder=output_folder,
            filter_apps=filter_apps,
+           cpu_discount=cpu_discount,
+           gpu_discount=gpu_discount,
+           global_discount=global_discount,
            gpu_cluster_recommendation=gpu_cluster_recommendation)
        if qual_args:
            tool_obj = QualificationAsLocal(platform_type=qual_args['runtimePlatform'],

From 26589ca3e83e8ec1cdbee498f2c2ea6fcf732c18 Mon Sep 17 00:00:00 2001
From: cindyyuanjiang
Date: Thu, 21 Sep 2023 17:33:01 -0700
Subject: [PATCH 2/4] updated est savings cal

Signed-off-by: cindyyuanjiang
---
 .../spark_rapids_pytools/rapids/qualification.py | 16 +++++++---------
 1 file changed, 7 insertions(+), 9 deletions(-)

diff --git a/user_tools/src/spark_rapids_pytools/rapids/qualification.py b/user_tools/src/spark_rapids_pytools/rapids/qualification.py
index b5ba44d4a..e1fc258d0 100644
--- a/user_tools/src/spark_rapids_pytools/rapids/qualification.py
+++ b/user_tools/src/spark_rapids_pytools/rapids/qualification.py
@@ -305,8 +305,8 @@ def _process_price_discount_args(self):
             gpu_discount = int(raw_gpu_discount) if raw_gpu_discount != None else 0
             global_discount = int(raw_global_discount) if raw_global_discount != None else 0
         except Exception as ex:
-            self.logger.error('Invalid arguments. Failed to process discount arguments: %s', ex)
-            raise ex
+            self.logger.error('Discount arguments have incorrect type.')
+            raise RuntimeError('Invalid arguments. Discount arguments cannot be converted to integer.')
 
         if cpu_discount < 0 or cpu_discount > 100:
             self.logger.error('cpu_discount is out of range [0, 100]')
@@ -328,9 +328,6 @@ def _process_price_discount_args(self):
             self.ctxt.set_ctxt('cpu_discount', cpu_discount)
             self.ctxt.set_ctxt('gpu_discount', gpu_discount)
 
-        self.logger.info("cpu_discount = %s", cpu_discount)
-        self.logger.info("gpu_discount = %s", gpu_discount)
-
     def _process_custom_args(self):
         """
         Qualification tool processes extra arguments:
@@ -569,10 +566,11 @@ def __calc_apps_cost(self,
                                                      'savingRecommendationsRanges')
 
         def get_costs_for_single_app(df_row, estimator: SavingsEstimator) -> pd.Series:
-            cpu_cost, gpu_cost, est_savings = estimator.get_costs_and_savings(df_row['App Duration'],
-                                                                              df_row['Estimated GPU Duration'])
-            cpu_cost = (100 - self.ctxt.get_ctxt('cpu_discount')) / 100 * cpu_cost
-            gpu_cost = (100 - self.ctxt.get_ctxt('gpu_discount')) / 100 * gpu_cost
+            raw_cpu_cost, raw_gpu_cost, _ = estimator.get_costs_and_savings(df_row['App Duration'],
+                                                                            df_row['Estimated GPU Duration'])
+            cpu_cost = (100 - self.ctxt.get_ctxt('cpu_discount')) / 100 * raw_cpu_cost
+            gpu_cost = (100 - self.ctxt.get_ctxt('gpu_discount')) / 100 * raw_gpu_cost
+            est_savings = 100.0 - ((100.0 * gpu_cost) / cpu_cost)
             # We do not want to mistakenly mark a Not-applicable app as Recommended in the savings column
             if df_row[speedup_rec_col] == 'Not Applicable':
                 savings_recommendations = 'Not Applicable'

From 823cbc7040d995ed8bb1a20ff17ac049573119a1 Mon Sep 17 00:00:00 2001
From: cindyyuanjiang
Date: Thu, 21 Sep 2023 17:46:23 -0700
Subject: [PATCH 3/4] fix python formatting issues

Signed-off-by: cindyyuanjiang
---
 user_tools/pyproject.toml                                  |  2 +-
 .../src/spark_rapids_pytools/rapids/qualification.py       | 10 +++++-----
 2 files changed, 6 insertions(+), 6 deletions(-)

diff --git a/user_tools/pyproject.toml b/user_tools/pyproject.toml
index 0ea4a163c..b9bb82ad8 100644
--- a/user_tools/pyproject.toml
+++ b/user_tools/pyproject.toml
@@ -41,7 +41,7 @@ dependencies = [
     "azure-storage-blob==12.17.0",
     "adlfs==2023.4.0"
 ]
-dynamic=["entry-points", "version"]
+dynamic=["version"]
 
 [project.scripts]
 spark_rapids_user_tools = "spark_rapids_pytools.wrapper:main"
diff --git a/user_tools/src/spark_rapids_pytools/rapids/qualification.py b/user_tools/src/spark_rapids_pytools/rapids/qualification.py
index e1fc258d0..493d0e30e 100644
--- a/user_tools/src/spark_rapids_pytools/rapids/qualification.py
+++ b/user_tools/src/spark_rapids_pytools/rapids/qualification.py
@@ -295,18 +295,18 @@ def _process_price_discount_args(self):
         raw_cpu_discount = self.wrapper_options.get('cpuDiscount')
         raw_gpu_discount = self.wrapper_options.get('gpuDiscount')
         raw_global_discount = self.wrapper_options.get('globalDiscount')
-        if raw_global_discount != None and (raw_cpu_discount != None or raw_gpu_discount != None):
+        if raw_global_discount is not None and (raw_cpu_discount is not None or raw_gpu_discount is not None):
             self.logger.error('Setting both global_discount and either cpu_discount or '
                               'gpu_discount is inconsistent.')
             raise RuntimeError('Invalid arguments. If global_discount is specified, no additional '
                                'discount arguments (cpu_discount or gpu_discount) should be set.')
         try:
-            cpu_discount = int(raw_cpu_discount) if raw_cpu_discount != None else 0
-            gpu_discount = int(raw_gpu_discount) if raw_gpu_discount != None else 0
-            global_discount = int(raw_global_discount) if raw_global_discount != None else 0
+            cpu_discount = int(raw_cpu_discount) if raw_cpu_discount is not None else 0
+            gpu_discount = int(raw_gpu_discount) if raw_gpu_discount is not None else 0
+            global_discount = int(raw_global_discount) if raw_global_discount is not None else 0
         except Exception as ex:
             self.logger.error('Discount arguments have incorrect type.')
-            raise RuntimeError('Invalid arguments. Discount arguments cannot be converted to integer.')
+            raise RuntimeError('Invalid arguments. Discount arguments cannot be converted to integer.') from ex
 
         if cpu_discount < 0 or cpu_discount > 100:
             self.logger.error('cpu_discount is out of range [0, 100]')

From b7e69e20dc910776c5084f3aa3d187237cfa328b Mon Sep 17 00:00:00 2001
From: cindyyuanjiang
Date: Tue, 26 Sep 2023 11:52:17 -0700
Subject: [PATCH 4/4] removed redundant code

Signed-off-by: cindyyuanjiang
---
 user_tools/pyproject.toml                        |  2 +-
 .../rapids/qualification.py                      | 21 ++++++++-----------
 2 files changed, 10 insertions(+), 13 deletions(-)

diff --git a/user_tools/pyproject.toml b/user_tools/pyproject.toml
index b9bb82ad8..0ea4a163c 100644
--- a/user_tools/pyproject.toml
+++ b/user_tools/pyproject.toml
@@ -41,7 +41,7 @@ dependencies = [
     "azure-storage-blob==12.17.0",
     "adlfs==2023.4.0"
 ]
-dynamic=["version"]
+dynamic=["entry-points", "version"]
 
 [project.scripts]
 spark_rapids_user_tools = "spark_rapids_pytools.wrapper:main"
diff --git a/user_tools/src/spark_rapids_pytools/rapids/qualification.py b/user_tools/src/spark_rapids_pytools/rapids/qualification.py
index 493d0e30e..fe6e10047 100644
--- a/user_tools/src/spark_rapids_pytools/rapids/qualification.py
+++ b/user_tools/src/spark_rapids_pytools/rapids/qualification.py
@@ -292,6 +292,12 @@ def __process_filter_args(self, arg_val: str):
         self.ctxt.set_ctxt('filterApps', selected_filter)
 
     def _process_price_discount_args(self):
+        def check_discount_percentage(discount_type: str, discount_value: int):
+            if discount_value < 0 or discount_value > 100:
+                self.logger.error('%s is out of range [0, 100]', discount_type)
+                raise RuntimeError(f'Invalid arguments. {discount_type} = {discount_value} is an invalid '
+                                   'percentage.')
+
         raw_cpu_discount = self.wrapper_options.get('cpuDiscount')
         raw_gpu_discount = self.wrapper_options.get('gpuDiscount')
         raw_global_discount = self.wrapper_options.get('globalDiscount')
@@ -308,18 +314,9 @@ def _process_price_discount_args(self):
             self.logger.error('Discount arguments have incorrect type.')
             raise RuntimeError('Invalid arguments. Discount arguments cannot be converted to integer.') from ex
 
-        if cpu_discount < 0 or cpu_discount > 100:
-            self.logger.error('cpu_discount is out of range [0, 100]')
-            raise RuntimeError(f'Invalid arguments. cpu_discount = {cpu_discount} is an invalid '
-                               'percentage.')
-        if gpu_discount < 0 or gpu_discount > 100:
-            self.logger.error('gpu_discount is out of range [0, 100]')
-            raise RuntimeError(f'Invalid arguments. gpu_discount = {gpu_discount} is an invalid '
-                               'percentage.')
-        if global_discount < 0 or global_discount > 100:
-            self.logger.error('global_discount is out of range [0, 100]')
-            raise RuntimeError(f'Invalid arguments. global_discount = {global_discount} is an invalid '
-                               'percentage.')
+        check_discount_percentage('cpu_discount', cpu_discount)
+        check_discount_percentage('gpu_discount', gpu_discount)
+        check_discount_percentage('global_discount', global_discount)
 
         if global_discount != 0:
             self.ctxt.set_ctxt('cpu_discount', global_discount)
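
Usage sketch: taken together, the four patches scale each estimated cost to
(100 - discount) / 100 of its raw value and recompute the estimated savings
from the discounted costs. The standalone Python sketch below illustrates only
that arithmetic; the helper name apply_discounts and the dollar figures in the
example are made up for illustration and are not part of the patches.

    def check_discount_percentage(discount_type: str, discount_value: int) -> None:
        # Range check mirroring the helper introduced in PATCH 4/4.
        if discount_value < 0 or discount_value > 100:
            raise RuntimeError(f'Invalid arguments. {discount_type} = {discount_value} '
                               'is an invalid percentage.')

    def apply_discounts(raw_cpu_cost: float, raw_gpu_cost: float,
                        cpu_discount: int = 0, gpu_discount: int = 0):
        # Assumes a non-zero discounted CPU cost, as the patched code does.
        check_discount_percentage('cpu_discount', cpu_discount)
        check_discount_percentage('gpu_discount', gpu_discount)
        cpu_cost = (100 - cpu_discount) / 100 * raw_cpu_cost
        gpu_cost = (100 - gpu_discount) / 100 * raw_gpu_cost
        # PATCH 2/4 recomputes savings from the discounted costs instead of
        # reusing the estimator's raw savings figure.
        est_savings = 100.0 - ((100.0 * gpu_cost) / cpu_cost)
        return cpu_cost, gpu_cost, est_savings

    # Example: hypothetical raw costs of $10 (CPU) and $6 (GPU) with a 30% CPU
    # discount yield (7.0, 6.0, ~14.29), i.e. about 14% estimated savings.
    print(apply_discounts(10.0, 6.0, cpu_discount=30))

With the new options wired through tools_cli.py and the platform wrappers, an
invocation such as `spark_rapids_user_tools dataproc qualification --eventlogs
<logs> --cpu_discount 30` (flag spelling assumed from the parameter names)
would feed the discount into this calculation.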