From 731fc16bbc9c378ae662a72aef62a18f098c4bba Mon Sep 17 00:00:00 2001 From: git-hyagi <45576767+git-hyagi@users.noreply.github.com> Date: Wed, 8 Jan 2025 15:21:41 -0300 Subject: [PATCH] Add a tool to visualize the tasking system ref: PULP-241 --- management_tools/Dockerfile | 9 ++ management_tools/README.md | 78 +++++++++++ management_tools/gnuplot-script | 23 ++++ management_tools/tasks-cli.py | 231 ++++++++++++++++++++++++++++++++ 4 files changed, 341 insertions(+) create mode 100644 management_tools/Dockerfile create mode 100644 management_tools/README.md create mode 100644 management_tools/gnuplot-script create mode 100644 management_tools/tasks-cli.py diff --git a/management_tools/Dockerfile b/management_tools/Dockerfile new file mode 100644 index 0000000..b0c8863 --- /dev/null +++ b/management_tools/Dockerfile @@ -0,0 +1,9 @@ +FROM registry.fedoraproject.org/fedora-minimal:39 + +RUN microdnf install -y pip gnuplot && microdnf clean all +RUN pip install requests && rm -rf /root/.cache/pip + +COPY gnuplot-script . +COPY tasks-cli.py . + +CMD ["python", "tasks-cli.py"] diff --git a/management_tools/README.md b/management_tools/README.md new file mode 100644 index 0000000..f74f5f4 --- /dev/null +++ b/management_tools/README.md @@ -0,0 +1,78 @@ +# RUNNING FROM SOURCE + +* installing dependencies +``` +sudo dnf install -y gnuplot +pip install requests +``` + +* [optional] create a folder to output the data (or set the -o/--output when running tasks-cli command) +``` +mkdir /tmp/tasks-cli +``` + +* running + + ``` + cd management_tools + ``` + + * stage + ``` + HTTPS_PROXY=http://squid.corp.redhat.com:3128 python tasks-cli.py -c -k --base_address https://mtls.internal.console.stage.redhat.com + ``` + + * prod + ``` + python tasks-cli.py -c -k --base_address https://mtls.internal.console.redhat.com + ``` + +A new graph file will be created with the definition from `--graph_file` (if not provided the default value is `/tmp/tasks-cli/graph_tasks.ps`). + + +# RUNNING AS A CONTAINER + +* building +``` +cd management_tools/ +podman build -t tasks-cli:latest . +``` + +* create a folder to output the data +``` +mkdir /tmp/tasks-cli +``` + +* running + * ephemeral + ``` + podman run -v /tmp/tasks-cli:/tmp/tasks-cli -it --rm tasks-cli python tasks-cli.py \ + --base_address http://$(oc get routes pulp-api -ojsonpath='{.spec.host}') \ + --password $(oc extract secret/pulp-admin-password --to=-) \ + --output /tmp/tasks-cli/test.out \ + -g /tmp/tasks-cli/graph.ps + ``` + + * stage + ``` + podman run -v :/tmp/cert-dir/ -v /tmp/tasks-cli:/tmp/tasks-cli -it --rm tasks-cli HTTPS_PROXY=http://squid.corp.redhat.com:3128 python tasks-cli.py \ + --period 2 --bucket_size 600 \ + --base_address https://mtls.internal.console.stage.redhat.com \ + -c /tmp/cert-dir/ \ + -k /tmp/cert-dir/ \ + --output /tmp/tasks-cli/ \ + -g /tmp/tasks-cli/ + ``` + + * prod + ``` + podman run -v :/tmp/cert-dir/ -v /tmp/tasks-cli:/tmp/tasks-cli -it --rm tasks-cli python tasks-cli.py \ + --period 2 --bucket_size 600 \ + --base_address https://mtls.internal.console.redhat.com \ + -c /tmp/cert-dir/ \ + -k /tmp/cert-dir/ \ + --output /tmp/tasks-cli/ \ + -g /tmp/tasks-cli/ + ``` + +A new graph file will be created with the definition from `--graph_file` (if not provided the default value is `/tmp/tasks-cli/graph_tasks.ps`). diff --git a/management_tools/gnuplot-script b/management_tools/gnuplot-script new file mode 100644 index 0000000..ed53d3f --- /dev/null +++ b/management_tools/gnuplot-script @@ -0,0 +1,23 @@ +#set xlabel "Values" +set title "Tasks" +set terminal postscript enhanced color landscape +set output graph_file + +#set xdata time +#set timefmt "%Y-%m-%dT%H:%M:%S.%zZ" +#set style data lines + +set style data histogram +set style histogram rowstacked +set boxwidth 0.75 +#set style histogram cluster gap 1 +set style fill solid 1.0 border -1.0 # Fill style for the boxes + +# Fine control of the major (labelled) tics on the x axis +set xtics rotate by -90 +set grid ytics lt rgb "gray" + +#plot "/tmp/a" u 1:2 +plot data_file using 2:xtic(1) ti 'runing' lt rgb 'green', '' using 3 ti 'waiting blocked' lt rgb 'red', '' using 4 ti 'waiting unblocked' lt rgb 'blue' + +#pause -1 diff --git a/management_tools/tasks-cli.py b/management_tools/tasks-cli.py new file mode 100644 index 0000000..60195ae --- /dev/null +++ b/management_tools/tasks-cli.py @@ -0,0 +1,231 @@ +import argparse +import json +import os +import requests +import subprocess +import sys + +from datetime import datetime, timedelta +from types import SimpleNamespace + + +DATETIME_FORMAT = "%Y-%m-%dT%H:%M:%S.%fZ" +TASKS_ENDPOINT = "/api/pulp/admin/tasks/?fields=pulp_created&" + +QUERY_TYPES = SimpleNamespace( + RUNNING="running", + WAITING_UNBLOCKED="waiting_unblocked", + WAITING_BLOCKED="waiting_blocked", +) + +parser = argparse.ArgumentParser() +parser.add_argument( + "-b", + "--base_address", + help="Pulp hostname address. For example: http://pulp-service:5001", +) +parser.add_argument( + "-u", + "--username", + help="Pulp user to run the API requests. [DEFAULT: admin]", + default="admin", +) +parser.add_argument("-p", "--password", help="Password for Pulp user.") +parser.add_argument( + "-c", "--certificate", help="Certificate to authenticate to Pulp API." +) +parser.add_argument( + "-k", "--key", help="Private key for the certificate authentication." +) +parser.add_argument( + "--period", + help="Period, in hours, to check the tasks. For example, for the last 24 hours: --period=24 [DEFAULT: 2]", + type=int, + default=2, +) +parser.add_argument( + "--bucket_size", + help="Bucket size, in seconds. For example, for a 30 seconds bucket: --bucket-size=30 [DEFAULT: 600]", + type=int, + default=600, +) +parser.add_argument( + "-o", + "--output", + help="Output file with the metrics. [DEFAULT: /tmp/tasks-cli/pulp_tasks.out]", + type=str, + default="/tmp/tasks-cli/pulp_tasks.out", +) +parser.add_argument( + "-g", + "--graph_file", + help="Gnuplot output file. [DEFAULT: /tmp/tasks-cli/graph_tasks.ps]", + type=str, + default="/tmp/tasks-cli/graph_tasks.ps", +) + +args = parser.parse_args() + +base_addr = args.base_address +username = args.username +password = args.password +pulp_certificate = args.certificate +pulp_cert_key = args.key +period_in_hours = args.period +bucket_size_in_seconds = args.bucket_size +output_file = args.output +graph_file = args.graph_file + + +def run(): + + datetime_now = datetime.now() + query_date_time = datetime_now - timedelta(hours=period_in_hours) + start_date = query_date_time.strftime(DATETIME_FORMAT) + data = initialize_response_structure( + period_in_hours, bucket_size_in_seconds, query_date_time + ) + + for task_state in QUERY_TYPES.__dict__.values(): + tasks = get_tasks(start_date, task_state) + make_buckets( + tasks, + bucket_size_in_seconds, + query_date_time, + period_in_hours, + task_state, + data, + ) + + write_to_file(data) + p = subprocess.Popen( + "gnuplot -e \"data_file='" + + output_file + + "'\" -e \"graph_file='" + + graph_file + + "'\" -c gnuplot-script", + shell=True, + ) + os.waitpid(p.pid, 0) + + +def write_to_file(data): + try: + with open(output_file, "w") as f: + for key in data: + print( + key, + data[key][QUERY_TYPES.RUNNING], + data[key][QUERY_TYPES.WAITING_BLOCKED], + data[key][QUERY_TYPES.WAITING_UNBLOCKED], + ) + f.write( + key + + " " + + str(data[key][QUERY_TYPES.RUNNING]) + + " " + + str(data[key][QUERY_TYPES.WAITING_BLOCKED]) + + " " + + str(data[key][QUERY_TYPES.WAITING_UNBLOCKED]) + + "\n" + ) + except FileNotFoundError: + dirname = os.path.dirname(os.path.abspath(output_file)) + print(dirname, "not found!") + print( + 'Make sure', + dirname, + 'exists or set a different path for the output (tasks-cli -o/--output )', + ) + sys.exit(2) + + +def get_tasks(start_date, query_type=None): + url = base_addr + TASKS_ENDPOINT + "started_at__gte=" + start_date + if query_type == QUERY_TYPES.RUNNING: + url = running_tasks_url(start_date) + elif query_type == QUERY_TYPES.WAITING_UNBLOCKED: + url = tasks_in_waiting_state_and_unblocked_url(False) + elif query_type == QUERY_TYPES.WAITING_BLOCKED: + url = tasks_in_waiting_state_and_unblocked_url(True) + + if pulp_certificate: + response = requests.get(url, cert=(pulp_certificate, pulp_cert_key)) + else: + response = requests.get(url, auth=(username, password)) + + if response.status_code // 100 != 2: + print("ERROR:", response.status_code, response.text) + sys.exit(1) + + response_json = json.loads(response.text) + + tasks_found_datetime = [] + if response_json.get("results"): + for result in response_json["results"]: + tasks_found_datetime.append(result["pulp_created"]) + + return tasks_found_datetime + + +def initialize_response_structure(period, bucket_size, query_date_time): + data = {} + total_seconds = timedelta(hours=period).total_seconds() + number_of_intervals = int(total_seconds // bucket_size) + + # Create a list of bucket start times + bucket_starts = [ + query_date_time + timedelta(seconds=i * bucket_size) + for i in range(number_of_intervals) + ] + + # Initialize buckets + for start_time in bucket_starts: + data[start_time.strftime(DATETIME_FORMAT)] = {} + for task_state in QUERY_TYPES.__dict__.values(): + data[start_time.strftime(DATETIME_FORMAT)][task_state] = 0 + + return data + + +def make_buckets( + tasks_found_datetime, bucket_size, query_date_time, period, query_type, data +): + if tasks_found_datetime == [None]: + return data + + total_seconds = timedelta(hours=period).total_seconds() + number_of_intervals = int(total_seconds // bucket_size) + + # Count tasks in each bucket + for task_datetime_str in tasks_found_datetime: + task_datetime = datetime.strptime(task_datetime_str, DATETIME_FORMAT) + + # Find the appropriate bucket for the task + for i in range(number_of_intervals): + start_time = query_date_time + timedelta(seconds=i * bucket_size) + end_time = start_time + timedelta(seconds=bucket_size) + + if start_time < task_datetime < end_time: + data[start_time.strftime(DATETIME_FORMAT)][query_type] += 1 + break # Task is counted, no need to check further + + return data + + +def running_tasks_url(start_date): + return ( + base_addr + TASKS_ENDPOINT + "started_at__gte=" + start_date + "&state=running" + ) + + +def tasks_in_waiting_state_and_unblocked_url(unblocked_null): + return ( + base_addr + + TASKS_ENDPOINT + + "&state=waiting&unblocked_at__isnull=" + + str(unblocked_null) + ) + + +run()