Skip to content

Commit

Permalink
Update resource_manager.py
Browse files Browse the repository at this point in the history
  • Loading branch information
fabriziosalmi authored Aug 22, 2024
1 parent a9b54d3 commit c166628
Showing 1 changed file with 34 additions and 48 deletions.
82 changes: 34 additions & 48 deletions lxc_autoscale/resource_manager.py
Original file line number Diff line number Diff line change
@@ -1,19 +1,12 @@
from config import config
import logging # For logging events and errors
from time import sleep # To introduce delays in the main loop
from lxc_utils import ( # Import various utility functions related to LXC container management
run_command, get_containers, is_container_running, backup_container_settings,
load_backup_settings, rollback_container_settings, log_json_event, get_total_cores,
get_total_memory, get_cpu_usage, get_memory_usage, is_ignored, get_container_data,
collect_container_data, prioritize_containers, get_container_config,
generate_unique_snapshot_name, generate_cloned_hostname
)
from scaling_manager import manage_horizontal_scaling, adjust_resources # Import scaling management functions
from notification import send_notification # Import notification function
from config import HORIZONTAL_SCALING_GROUPS, IGNORE_LXC, DEFAULTS # Import configuration constants
import config
import logging
from time import sleep
import lxc_utils
import scaling_manager
import notification
from concurrent.futures import ThreadPoolExecutor, as_completed

def collect_data_for_container(ctid: str) -> dict:
    """
    Collect resource usage data for a single LXC container.

    Args:
        ctid (str): The container ID.

    Returns:
        dict: A mapping of ctid to its usage data, or None if the container
        is not running or its configuration could not be read/parsed.
    """
    if not lxc_utils.is_container_running(ctid):
        return None

    logging.debug(f"Collecting data for container {ctid}...")

    try:
        # Retrieve the current configuration of the container and parse the
        # 'cores' and 'memory' settings. Keys are matched exactly (pct config
        # emits "key: value" lines) — a plain substring test could match
        # unrelated lines such as a hostname containing "cores".
        config_output = lxc_utils.run_command(f"pct config {ctid}")
        cores = memory = None
        for line in config_output.splitlines():
            key, _, value = line.partition(":")
            if key.strip() == "cores":
                cores = int(value.strip())
            elif key.strip() == "memory":
                memory = int(value.strip())

        if cores is None or memory is None:
            logging.error(f"Error parsing core or memory values for container {ctid}: missing 'cores' or 'memory' entry")
            return None

        settings = {"cores": cores, "memory": memory}

        # Backup the current settings so they can be rolled back if a later
        # adjustment misbehaves.
        lxc_utils.backup_container_settings(ctid, settings)

        # Collect CPU and memory usage data
        return {
            ctid: {
                "cpu": lxc_utils.get_cpu_usage(ctid),
                "mem": lxc_utils.get_memory_usage(ctid),
                "initial_cores": cores,
                "initial_memory": memory,
            }
        }
    except ValueError as ve:
        # int() failed on a malformed value
        logging.error(f"Error parsing core or memory values for container {ctid}: {ve}")
        return None
    except Exception as e:
        logging.error(f"Error retrieving or parsing configuration for container {ctid}: {e}")
        return None

def collect_container_data() -> dict:
    """
    Collect resource usage data for all LXC containers in parallel.

    Returns:
        dict: A dictionary where the keys are container IDs and the values
        are their respective data. Containers that are not running or whose
        data could not be collected are omitted.
    """
    containers = {}
    with ThreadPoolExecutor(max_workers=8) as executor:
        futures = {executor.submit(collect_data_for_container, ctid): ctid for ctid in lxc_utils.get_containers()}
        for future in as_completed(futures):
            # Map the future back to its container ID so failures are traceable.
            ctid = futures[future]
            try:
                container_data = future.result()
                if container_data:
                    containers.update(container_data)
            except Exception as e:
                logging.error(f"Error collecting data for container {ctid}: {e}")
    return containers





def main_loop(poll_interval: int, energy_mode: bool):
    """
    Run the resource allocation and scaling process indefinitely.

    Args:
        poll_interval (int): The interval in seconds between each resource allocation process.
        energy_mode (bool): A flag to indicate if energy efficiency mode should be enabled during off-peak hours.
    """
    while True:
        logging.info("Starting resource allocation process...")
        try:
            # Gather usage data for every container, then apply vertical
            # adjustments and horizontal scaling based on it.
            snapshot = collect_container_data()
            scaling_manager.adjust_resources(snapshot, energy_mode)
            scaling_manager.manage_horizontal_scaling(snapshot)
            logging.info(f"Resource allocation process completed. Next run in {poll_interval} seconds.")
        except Exception as e:
            # Log and keep the loop alive; the next cycle may succeed.
            logging.error(f"Error in main loop: {e}")
        finally:
            # Both the success and failure paths wait out the polling interval.
            sleep(poll_interval)

0 comments on commit c166628

Please sign in to comment.