Fix benchmark memory issues
strtgbb committed Oct 24, 2024
1 parent 50a1165 commit 671afe0
Showing 1 changed file with 6 additions and 2 deletions.
ontime_benchmark/tests/benchmark.py (8 changes: 6 additions & 2 deletions)
@@ -15,7 +15,11 @@ def insert_ontime_data(self, from_year, to_year, table_name, node=None):
         node = self.context.node
 
     node.query(
-        f"INSERT INTO {table_name} SELECT * FROM s3('https://clickhouse-public-datasets.s3.amazonaws.com/ontime/csv_by_year/{{{from_year}..{to_year}}}.csv.gz', CSVWithNames) SETTINGS max_insert_threads = 20, receive_timeout=600, max_memory_usage=0;",
+        f"INSERT INTO {table_name} "
+        f"SELECT * FROM s3('https://clickhouse-public-datasets.s3.amazonaws.com/ontime/csv_by_year/{{{from_year}..{to_year}}}.csv.gz', CSVWithNames) "
+        "SETTINGS receive_timeout=600, "
+        "max_insert_threads=10, "  # This affects memory more than it affects performance
+        "max_memory_usage=29500000000;",  # Runners have about this much available memory
         timeout=1200,
     )
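
For a concrete sense of what the rewritten call sends, take from_year=2007 and to_year=2012 (the range run_benchmark uses below) and an illustrative table name ontime: the adjacent f-strings join into a single statement (shown here across lines for readability), and the {2007..2012} brace range makes the s3 table function read one CSV file per year:

INSERT INTO ontime
SELECT * FROM s3('https://clickhouse-public-datasets.s3.amazonaws.com/ontime/csv_by_year/{2007..2012}.csv.gz', CSVWithNames)
SETTINGS receive_timeout=600, max_insert_threads=10, max_memory_usage=29500000000;

Two of the changed settings do the actual work: max_insert_threads drops from 20 to 10, halving the number of parallel insert pipelines that each buffer blocks in memory, and max_memory_usage goes from 0 (unlimited) to an explicit cap just under the runners' RAM, so an over-budget insert fails with a catchable memory-limit error instead of letting the server get OOM-killed mid-benchmark.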

@@ -186,7 +190,7 @@ def run_benchmark(num):
     start_year = 2007
     end_year = 2012
 
-    for retry in retries(timeout=60, delay=0.1):
+    for retry in retries(timeout=60, delay=1):
         with retry:
             Step(
                 name=f"insert data from {start_year} to {end_year} into ontime table",
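
The delay bump is small but meaningful. As an illustration (a minimal sketch of a retries()-style helper, not the actual testflows implementation), the pattern used above can be modeled like this: each yielded attempt is a context manager that swallows a failure, sleeps delay seconds, and retries until timeout is exhausted.

import time


class _Attempt:
    def __init__(self, loop):
        self.loop = loop

    def __enter__(self):
        return self

    def __exit__(self, exc_type, exc, tb):
        if exc_type is None:
            self.loop.succeeded = True  # body passed; stop iterating
            return False
        if time.monotonic() >= self.loop.deadline:
            return False  # out of time; let the last error propagate
        time.sleep(self.loop.delay)  # back off before the next attempt
        return True  # suppress the error and retry


class retries:
    """Sketch of a retries() helper driving `for retry in retries(...): with retry:`."""

    def __init__(self, timeout, delay):
        self.deadline = time.monotonic() + timeout
        self.delay = delay
        self.succeeded = False

    def __iter__(self):
        while not self.succeeded:
            yield _Attempt(self)

Under this model, delay=0.1 would re-attempt a failing insert up to roughly 600 times inside the 60-second window; delay=1 spaces attempts a second apart, giving the server room to release memory between tries.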
