From a8f3342ad117ade955d03b794c043d29feeb4848 Mon Sep 17 00:00:00 2001 From: KarthikL1729 Date: Wed, 30 Oct 2024 20:34:01 +0530 Subject: [PATCH] Added the mapper tool to map trace to vSwarm proxies. Added documentation for the mapper tool. Signed-off-by: KarthikL1729 --- .github/configs/wordlist.txt | 17 +- docs/mapper.md | 88 ++++++++++ tools/mapper/.gitattributes | 1 + tools/mapper/find_proxy_function.py | 252 ++++++++++++++++++++++++++++ tools/mapper/log_config.py | 37 ++++ tools/mapper/mapper.py | 147 ++++++++++++++++ tools/mapper/profile.tar.gz | 3 + 7 files changed, 544 insertions(+), 1 deletion(-) create mode 100644 docs/mapper.md create mode 100644 tools/mapper/.gitattributes create mode 100644 tools/mapper/find_proxy_function.py create mode 100644 tools/mapper/log_config.py create mode 100644 tools/mapper/mapper.py create mode 100644 tools/mapper/profile.tar.gz diff --git a/.github/configs/wordlist.txt b/.github/configs/wordlist.txt index 2f81774e6..579902810 100644 --- a/.github/configs/wordlist.txt +++ b/.github/configs/wordlist.txt @@ -771,4 +771,19 @@ autoscaler FailAt FailComponent FailNode -FailureEnabled \ No newline at end of file +FailureEnabled +DIRECTORYPATH +FILEPATH +directorypath +filepath +HashApp +HashFunction +HashOwner +AverageAllocatedMb +SampleCount +Jonker +Pipelined +SciPy +Volgenant +injective +py \ No newline at end of file diff --git a/docs/mapper.md b/docs/mapper.md new file mode 100644 index 000000000..30171e53b --- /dev/null +++ b/docs/mapper.md @@ -0,0 +1,88 @@ +# Mapper + +The mapper tool can be used to map the functions in a given trace directory (with memory and duration traces) to the proxy functions in the [`vSwarm`](https://github.com/vhive-serverless/vSwarm/tree/main/) benchmark suite. The benchmarks present in the vSwarm benchmark suite have been profiled and their memory utilization and duration traces have been collected and stored in the `profile.json` file. Each function in the trace is mapped to a function in the benchmark suite as its closest proxy (based on memory and duration correlation). + +The `profile.json` JSON output file is generated by the [`profiler` tool](https://github.com/vhive-serverless/vSwarm/tree/load-generator/tools/profiler#profiler) to obtain the profile of the benchmark suite functions. + +### Usage + +```bash +usage: mapper.py [-h] -t TRACE_DIRECTORYPATH -p PROFILE_FILEPATH [-o OUTPUT_FILEPATH] [-u UNIQUE_ASSIGNMENT] + +Arguments: + -h, --help show this help message and exit + -t TRACE_DIRECTORYPATH, --trace-directorypath TRACE_DIRECTORYPATH + Path to the directory containing the trace files (required) + -p PROFILE_FILEPATH, --profile-filepath PROFILE_FILEPATH + Path to the profile file containing the proxy functions + -u UNIQUE_ASSIGNMENT, --unique-assignment UNIQUE_ASSIGNMENT + Whether to assign unique proxy functions to each trace function +``` +The tool reads the trace information(memory and duration details) from the `trace/` directory (can be configured using `-t` or `--trace-directorypath` flags). The `trace/` directory must contain the `memory.csv` and `durations.csv` files containing the respective trace information of the format mentioned in [*Azure Functions Dataset 2019*](https://github.com/Azure/AzurePublicDataset/blob/master/AzureFunctionsDataset2019.md) + +#### Function Execution Duration `durations.csv` Schema + +|Field|Description | +|--|--| +| HashOwner | unique id of the application owner | +| HashApp | unique id for application name | +| HashFunction | unique id for the function name within the app | +|Average | Average execution time (ms) across all invocations of the 24-period| +|Count | Number of executions used in computing the average| +|Minimum | Minimum execution time| +|Maximum | Maximum execution time| +|percentile_Average_0| Weighted 0th-percentile of the execution time *average*| +|percentile_Average_1| Weighted 1st-percentile of the execution time *average*| +|percentile_Average_25 | Weighted 25th-percentile of the execution time *average*| +|percentile_Average_50 | Weighted 50th-percentile of the execution time *average*| +|percentile_Average_75 | Weighted 75th-percentile of the execution time *average*| +|percentile_Average_99 | Weighted 99th-percentile of the execution time *average*| +|percentile_Average_100 | Weighted 100th-percentile of the execution time *average*| +Execution time is in milliseconds. + +#### Function Memory Usage `memory.csv` Schema + +|Field|Description | +|--|--| +| HashOwner | unique id of the application owner | +| HashApp | unique id for application name | +| HashFunction | unique id for the function name within the app | +|SampleCount | Number of samples used for computing the average | +|AverageAllocatedMb | Average allocated memory across all SampleCount measurements| +|AverageAllocatedMb_pct1 | 1st percentile of the average allocated memory| +|AverageAllocatedMb_pct5 | 5th percentile of the average allocated memory| +|AverageAllocatedMb_pct25 | 25th percentile of the average allocated memory| +|AverageAllocatedMb_pct50 | 50th percentile of the average allocated memory| +|AverageAllocatedMb_pct75 | 75th percentile of the average allocated memory| +|AverageAllocatedMb_pct95 | 95th percentile of the average allocated memory| +|AverageAllocatedMb_pct99 | 99th percentile of the average allocated memory| +|AverageAllocatedMb_pct100 | 100th percentile of the average allocated memory| + +The [`sampler`](https://github.com/vhive-serverless/invitro/tree/main/sampler) tool in InVitro can be used to generate the sampled traces from the original Azure traces. + +For every function in the trace, the closest function in the [`vSwarm`](https://github.com/vhive-serverless/vSwarm/tree/main/) benchmark suite is set as its proxy (75-percentile memory and 75-percentile duration are considered to find the highest correlation). If the `-u` (or `--unique-assignment`) flag is set to true, the tool tries to find a one-to-one (injective) mapping between trace functions and proxy functions by modelling it as a *linear sum assignment* problem which is solved by the SciPy implementation of the *Jonker-Volgenant algorithm*. The 75th percentile is used to ensure that the mapping is not only corresponding to the peak values of the workload, but is also leading to a representative proxy function. If the number of trace functions is greater than the number of proxy functions, or if the mapping is not achieved, the injective constraint is removed, and the closest proxy function is obtained. Currently the tool utilizes only _Serving Functions_ that are _NOT Pipelined_ as proxy functions. + +This mapping requires the profiles of the benchmark functions for it to be used as a proxy. The tool utilizes the `profile.json` JSON output file generated by the [`profiler` tool](https://github.com/vhive-serverless/vSwarm/tree/load-generator/tools/profiler#profiler) to obtain the profile of the benchmark suite functions. The User can configure the path of the JSON file through the `-p` (or `--profile-filepath`) flag (by default, it is `profile.json`, which needs to be unzipped). + +An example of a generated output file is as follows: + +```json +{ + "c13acdc7567b225971cef2416a3a2b03c8a4d8d154df48afe75834e2f5c59ddf": { + "proxy-function": "video-processing-python-10" + }, + "a2faad786b3c813b12ce57d349d5e62f6d0f22ceecfa86cd72a962853383b600": { + "proxy-function": "image-rotate-go-11" + }, + "7dc5aeabc131669912e8c793c8925cc9928321f45f13a4af031592b4611630d7": { + "proxy-function": "video-processing-python-70" + }, + "ae8a1640fa932024f59b38a0b001808b5c64612bd60c6f3eb80ba9461ba2d091": { + "proxy-function": "video-processing-python-20" + } +} +``` + +The mapper output file will be stored in the trace directory with the name `mapper_output.json` by default. The output file contains the mapping of the trace functions to the proxy functions in the vSwarm benchmark suite. + +--- \ No newline at end of file diff --git a/tools/mapper/.gitattributes b/tools/mapper/.gitattributes new file mode 100644 index 000000000..aa0e5878c --- /dev/null +++ b/tools/mapper/.gitattributes @@ -0,0 +1 @@ +profile.tar.gz filter=lfs diff=lfs merge=lfs -text diff --git a/tools/mapper/find_proxy_function.py b/tools/mapper/find_proxy_function.py new file mode 100644 index 000000000..5f475ebea --- /dev/null +++ b/tools/mapper/find_proxy_function.py @@ -0,0 +1,252 @@ +import numpy as np +import scipy.optimize as sp +import math + +from collections import OrderedDict + +from log_config import * +from typing import Tuple + +def get_error(trace_function, proxy_function) -> float: + """ + Returns a float value on how close the trace function is to the proxy function. Lower the value, better the correlation. + Euclidean distance between normalized memory and duration is considered. + + Parameters: + - `trace_function` (dict): Dictionary containing information regarding trace function + - `proxy_function` (dict): Dictionary containing information regarding proxy function + + Returns: + - `float`: closeness value + """ + + try: + trace_memory = trace_function["memory"]["75-percentile"] + proxy_memory = proxy_function["memory"]["75-percentile"] + trace_duration = trace_function["duration"]["75-percentile"] + proxy_duration = proxy_function["duration"]["75-percentile"] + except KeyError as e: + log.warning(f"Correlation cannot be found. Error: {e}") + return math.inf + + # NOTE: Better Error mechanisms can be considered to improve the correlation + # Currently only the 75%tile memory and duration are considered. + # Euclidean distance between normalized memory and duration is considered + try: + if trace_memory == 0: trace_memory += 0.01 + if trace_duration == 0: trace_duration += 0.01 + diff_memory = (math.log(trace_memory) - math.log(proxy_memory)) + diff_duration = (math.log(trace_duration) - math.log(proxy_duration)) + error = math.sqrt((diff_memory) ** 2 + (diff_duration) ** 2) + return error + except ValueError as e: + log.warning(f"Correlation cannot be found. Error: {e}") + return math.inf + + +def get_proxy_function_using_linear_sum_assignment( + trace_functions: dict, proxy_functions: dict +) -> Tuple[dict, int]: + """ + Obtains the one-to-one mapped proxy function for every trace function + + Parameters: + - `trace_functions` (dict): Dictionary containing information regarding trace functions + - `proxy_functions` (dict): Dictionary containing information regarding proxy functions + + Returns: + - `dict`: Dictionary containing information regarding trace functions with the associated proxy functions + - `int`: 0 if no error. -1 if error + """ + + try: + + trace_functions = OrderedDict(trace_functions) + proxy_functions = OrderedDict(proxy_functions) + + trace_list = [] + for tf in trace_functions: + trace_list.append(trace_functions[tf]) + trace_functions[tf]["index"] = len(trace_list) - 1 + + proxy_list = [] + for pf in proxy_functions: + proxy_list.append(proxy_functions[pf]) + proxy_functions[pf]["index"] = len(proxy_list) - 1 + + # Creating error matrix + m, n = len(trace_functions.keys()), len(proxy_functions.keys()) + error_matrix = np.empty((m, n)) + + # This utilized Jonker-Volgenant algorithm for Linear Sum assignment - scipy package + # to calculate the best possible assignment for the trace functions + # Time complexity : O(n^3) where n is the largest of number of rows/columns + for i in range(m): + for j in range(n): + error_matrix[i, j] = get_error(trace_list[i], proxy_list[j]) + + # Do the linear sum assignment problem + row_indices, col_indices = sp.linear_sum_assignment(error_matrix) + assignments = list(zip(row_indices, col_indices)) + + # Go through the assignment solution + for assignment in assignments: + row_index = assignment[0] + col_index = assignment[1] + trace = "" + proxy = "" + for tf in trace_functions: + if row_index == trace_functions[tf]["index"]: + trace = tf + break + for pf in proxy_functions: + if col_index == proxy_functions[pf]["index"]: + proxy = pf + break + trace_functions[trace]["proxy-function"] = proxy + trace_functions[trace]["proxy-correlation"] = get_error( + trace_functions[trace], proxy_functions[proxy] + ) + log.debug( + f"Found proxy function for {trace}: {trace_functions[trace]['proxy-function']} with correlation: {trace_functions[trace]['proxy-correlation']}" + ) + + # Go through the trace functions to ensure proxy function exists. If not, then report + for tf in trace_functions: + if "proxy-function" not in trace_functions[tf]: + log.warning(f"Mapping for function {tf} not found") + elif trace_functions[tf]["proxy-function"] == "": + log.warning(f"Mapping for function {tf} not found") + + # Deleting unnecessary stuffs + for tf in trace_functions: + del trace_functions[tf]["index"] + for pf in proxy_functions: + del proxy_functions[pf]["index"] + + return trace_functions, 0 + + except Exception as e: + log.error(f"Mapping through linear sum assignment failed. Error: {e}") + return trace_functions, -1 + + +def get_closest_proxy_function( + trace_functions: dict, proxy_functions: dict +) -> Tuple[dict, int]: + """ + Obtains the closest proxy function for every trace function + + Parameters: + - `trace_functions` (dict): Dictionary containing information regarding trace functions + - `proxy_functions` (dict): Dictionary containing information regarding proxy functions + + Returns: + - `dict`: Dictionary containing information regarding trace functions with the associated proxy functions + - `int`: 0 if no error. -1 if error + """ + + try: + proxy_list = [] + for function_name in proxy_functions: + proxy_list.append(proxy_functions[function_name]) + proxy_functions[function_name]["index"] = len(proxy_list) - 1 + + for function_name in trace_functions: + min_error = math.inf + min_error_index = -1 + for i in range(0, len(proxy_list)): + error = get_error(trace_functions[function_name], proxy_list[i]) + if error < min_error: + min_error = error + min_error_index = i + + if min_error == math.inf: + log.warning(f"Proxy function for function {function_name} not found") + continue + + trace_functions[function_name]["proxy-function"] = proxy_list[ + min_error_index + ]["name"] + trace_functions[function_name]["proxy-correlation"] = get_error( + trace_functions[function_name], proxy_list[min_error_index] + ) + log.debug( + f"Found proxy function for {function_name}: {trace_functions[function_name]['proxy-function']} with correlation: {trace_functions[function_name]['proxy-correlation']}" + ) + + for function_name in proxy_functions: + del proxy_functions[function_name]["index"] + + return trace_functions, 0 + + except Exception as e: + log.error(f"Finding closest proxy function failed. Error: {e}") + return trace_functions, -1 + + +def get_proxy_function( + trace_functions: dict, proxy_functions: dict, unique_assignment: bool +) -> Tuple[dict, int]: + """ + Obtains the closest proxy function for every trace function + + Parameters: + - `trace_functions` (dict): Dictionary containing information regarding trace functions + - `proxy_functions` (dict): Dictionary containing information regarding proxy functions + - `unique_assignment` (bool): If `True`, then trace-proxy function mapping is one-to-one, provided #(proxy functions) > #(trace functions) + + Returns: + - `dict`: Dictionary containing information regarding trace functions with the associated proxy functions + - `int`: 0 if no error. -1 if error + """ + + trace_functions = OrderedDict(trace_functions) + proxy_functions = OrderedDict(proxy_functions) + + log.info( + f"Lower the correlation value, the proxy function is a better proxy of the trace function" + ) + + if (unique_assignment) and (len(trace_functions) <= len(proxy_functions)): + log.info( + f"Getting One-To-One mapping between trace function and proxy function using Linear-Sum-Assignment" + ) + trace_functions, err = get_proxy_function_using_linear_sum_assignment( + trace_functions=trace_functions, proxy_functions=proxy_functions + ) + if err == -1: + log.error( + f"One-To-One mapping between trace function and proxy function not obtained" + ) + log.info( + f"Getting closest proxy function for every trace function. Note: Mapping may not be unique" + ) + trace_functions, err = get_closest_proxy_function( + trace_functions=trace_functions, proxy_functions=proxy_functions + ) + + elif (unique_assignment) and (len(trace_functions) > len(proxy_functions)): + log.warning( + f"One-To-One mapping between trace function and proxy function not possible since number of trace functions is greater than available proxy functions" + ) + log.info( + f"Getting closest proxy function for every trace function. Note: Mapping may not be unique" + ) + trace_functions, err = get_closest_proxy_function( + trace_functions=trace_functions, proxy_functions=proxy_functions + ) + + else: + log.info( + f"Getting closest proxy function for every trace function. Note: Mapping may not be unique" + ) + trace_functions, err = get_closest_proxy_function( + trace_functions=trace_functions, proxy_functions=proxy_functions + ) + + if err == -1: + log.critical(f"Mapping between trace function and proxy function not obtained") + return trace_functions, -1 + + return trace_functions, 0 \ No newline at end of file diff --git a/tools/mapper/log_config.py b/tools/mapper/log_config.py new file mode 100644 index 000000000..80437075b --- /dev/null +++ b/tools/mapper/log_config.py @@ -0,0 +1,37 @@ +import logging + +class CustomFormatter(logging.Formatter): + + blue = "\x1b[34;20m" + green = "\x1b[32;20m" + grey = "\x1b[38;20m" + yellow = "\x1b[33;20m" + red = "\x1b[31;20m" + bold_red = "\x1b[31;1m" + bold_red_white_bg = "\x1b[1;37;41m" + reset = "\x1b[0m" + format = "%(asctime)s - %(levelname)s - (%(filename)s:%(lineno)d) - %(message)s" + + FORMATS = { + logging.DEBUG: grey + format + reset, + logging.INFO: green + format + reset, + logging.WARNING: yellow + format + reset, + logging.ERROR: red + format + reset, + logging.CRITICAL: bold_red_white_bg + format + reset, + } + + def format(self, record): + log_fmt = self.FORMATS.get(record.levelno) + formatter = logging.Formatter(log_fmt) + return formatter.format(record) + + +log = logging.getLogger("Benchmark") +log.setLevel(logging.INFO) +ch = logging.StreamHandler() +ch.setFormatter(CustomFormatter()) +log.addHandler(ch) + +def setLogLevel(level: str) -> None: + if (level == "INFO"): log.setLevel(logging.INFO) + elif (level == "DEBUG"): log.setLevel(logging.DEBUG) \ No newline at end of file diff --git a/tools/mapper/mapper.py b/tools/mapper/mapper.py new file mode 100644 index 000000000..71e5299d0 --- /dev/null +++ b/tools/mapper/mapper.py @@ -0,0 +1,147 @@ +import os + +import json +import re +import argparse +import pandas as pd +from find_proxy_function import * + +from log_config import * + +def load_trace(trace_directorypath): + duration_info = {} + memory_info = {} + # Read the trace files and store the information + + # Read the durations file + duration_filepath = trace_directorypath + "/durations.csv" + if os.path.exists(duration_filepath): + log.info(f"Durations file {duration_filepath} exists. Accessing information") + try: + duration_info = pd.read_csv(duration_filepath) + except Exception as e: + log.critical( + f"Durations file {duration_filepath} cannot be read. Error: {e}" + ) + return None, -1 + + # Read the memory file + memory_filepath = trace_directorypath + "/memory.csv" + if os.path.exists(memory_filepath): + log.info(f"Memory file {memory_filepath} exists. Accessing information") + try: + memory_info = pd.read_csv(memory_filepath) + except Exception as e: + log.critical( + f"Memory file {memory_filepath} cannot be read. Error: {e}" + ) + return None, -1 + + # Rename all columns in the dataframe with a lambda (for example: percentile_Average_1 -> 1-percentile) if x matches a regex + duration_info = duration_info.rename(columns=lambda x: re.sub(r'percentile_(\w+)_(\d+)', r'\2-' + "percentile", x)) + # Rename all columns in the dataframe with a lambda (for example: AverageAllocatedMb_pct1 -> 1-percentile) if x matches a regex + memory_info = memory_info.rename(columns=lambda x: re.sub(r'AverageAllocatedMb_pct(\w+)', r'\1-' + "percentile", x)) + + # Add them to a dict with the key being the HashFunction + trace_functions = {} + + for _, row in duration_info.iterrows(): + hash_function = row["HashFunction"] + trace_functions[hash_function] = {} + trace_functions[hash_function]["duration"] = row + + for _, row in memory_info.iterrows(): + hash_function = row["HashFunction"] + trace_functions[hash_function]["memory"] = row + + return trace_functions, 0 + +def main(): + # Parse the arguments + parser = argparse.ArgumentParser(description="Mapper") + parser.add_argument( + "-t", + "--trace-directorypath", + type=str, + help="Path to the directory containing the trace files", + required=True, + ) + parser.add_argument( + "-p", + "--profile-filepath", + type=str, + help="Path to the profile file containing the proxy functions", + required=True, + ) + parser.add_argument( + "-u", + "--unique-assignment", + type=bool, + help="Whether to assign unique proxy functions to each trace function", + default=False, + required=False, + ) + args = parser.parse_args() + trace_directorypath = args.trace_directorypath + profile_filepath = args.profile_filepath + output_filepath = trace_directorypath + "/mapper_output.json" + unique_assignment = args.unique_assignment + trace_functions, err = load_trace(trace_directorypath) + if err == -1: + log.critical(f"Load Generation failed") + return + elif err == 0: + log.info(f"Trace loaded") + + ## Check whether the profile file for proxy functions exists or not + if os.path.exists(profile_filepath): + log.info( + f"Profile file for proxy functions {profile_filepath} exists. Accessing information" + ) + try: + with open(profile_filepath, "r") as jf: + proxy_functions = json.load(jf) + except Exception as e: + log.critical( + f"Profile file for proxy functions {profile_filepath} cannot be read. Error: {e}" + ) + log.critical(f"Load Generation failed") + return + else: + log.critical(f"Profile file for proxy functions {profile_filepath} not found") + log.critical(f"Load Generation failed") + return + + # Getting a proxy function for every trace function + trace_functions, err = get_proxy_function( + trace_functions=trace_functions, + proxy_functions=proxy_functions, + unique_assignment=unique_assignment, + ) + if err == -1: + log.critical(f"Load Generation failed") + return + elif err == 0: + log.info(f"Proxy functions obtained") + + # Writing the proxy functions to a file + + # Only give function name and proxy name + trace_json = {} + for function in trace_functions: + trace_json[function] = {} + trace_json[function]["proxy-function"] = trace_functions[function]["proxy-function"] + + try: + with open(output_filepath, "w") as jf: + json.dump(trace_json, jf, indent=4) + except Exception as e: + log.critical(f"Output file {output_filepath} cannot be written. Error: {e}") + log.critical(f"Load Generation failed") + return + + log.info(f"Output file {output_filepath} written") + log.info(f"Load Generation successful") + +if __name__ == "__main__": + main() \ No newline at end of file diff --git a/tools/mapper/profile.tar.gz b/tools/mapper/profile.tar.gz new file mode 100644 index 000000000..a0cba432c --- /dev/null +++ b/tools/mapper/profile.tar.gz @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3358e68efe00f99ca099095c3920c9f067e66a20b7edea7f4cc55990332901e4 +size 44662