jl3953 · Jun 16, 2021
diff --git a/‎.gitignore
+5 b/‎.gitignore
+5
diff --git a/‎README.md
+84 b/‎README.md
+84
diff --git a/‎config/async_lt.ini
+3 b/‎config/async_lt.ini
+3
diff --git a/‎config/lt.ini
+3 b/‎config/lt.ini
+3
diff --git a/‎src/README.md
+84 b/‎src/README.md
+84
diff --git a/‎src/async_config_object.py
+88 b/‎src/async_config_object.py
+88
diff --git a/‎src/async_determine_stable_interval.py
+70 b/‎src/async_determine_stable_interval.py
+70
@@ -0,0 +1,5 @@
+scratch/*
+src/__pycache__/*
+*.pyc
+config/2021*_*.ini
+src/trial_*_*.py
@@ -0,0 +1,84 @@
+# Hotnode incorporation checklist
+1) Did you change the hotnode address (`node-X:50051`) in cockroachdb 
+   `pkg/server/server.go`?
+   
+2) Does that address match the one in your `trial_<config_object_name>.py`
+in `self.hot_node`?
+    
+3) Did you change the hotkey threshold to be what you want in CRDB
+`pkg/sql/conn_executor_prepare.go` in `isHotkey(key byte[])`?
+   
+4) Does that threshold match the one in `trial_<config_object_name>.py`
+in `self.hot_node_threshold`?
+
+# How to implement a new server-client test script on branch async_redo
+
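+1) Copy `src/async_config_object.py` and name the copy
+   `src/trial_<whatever_you_want>.py`. The `.gitignore` ignores files matching
+   `src/trial_*_*.py`, so make sure the name has an underscore after the
+   `trial_` prefix (e.g. `trial_async_test.py`).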
+   - Make sure you populate the fields under the `#default`
+    comment.
+   - Make sure all methods are correctly written,
+    especially the part on populating server and client nodes.
+     For example, are the nodes regioned? Does it matter?
+   - Make sure `generate_all_config_files()` method is implemented.
+   - Make sure the concurrency of the clients is always called 
+     "concurrency" (`self.concurrency` in `ConfigObject`)
+
+2) Change the fields you need to.
+
+3) Change `config/async_lt.ini` for latency-throughput.
+
+4) Implement to the interface of `src/async_server.py`.
+    - When implementing `aggregate_raw_logs()` function,
+    make sure to use the keys
+      - throughput: `"ops/sec(cum)"`
+      - p50: `"p50(ms)"`
+      - p99: `"p99(ms)"`
+    or the latency throughput graphs won't gnuplot at all
+   - Make sure gnuplot is installed (`apt install gnuplot-x11`)
+
+5) Whatever you name your implementation from the previous
+step, change the line `import async_server` in `src/async_main.py`
+   to `import <whatever_you_implemented> as async_server`
+    
+6) Configure/implement the swath of functions at the
+head of `src/async_main.py` to match your needs.
+   - Make sure the directory is correct. It's set to 
+    `thermopylae_tests/scratch/db_{datetime}` right now.
+     
+7) From `~/thermopylae_tests` directory, run `python3 src/async_main.py`
+   
+# How to implement new `async_determine_stable_interval.py` on branch async_redo
+1) Code to the interface of `src/async_server.py`
+2) Replace `import async_server` with `import <whatever_you_coded> as async_server`
+3) From `~/thermopylae_tests` dir, run `python3 src/async_determine_stable_interval.py
+   --duration 30 --csv_location scratch/stabilizer --graph_location scratch/stabilizer`
+   (`--duration` is an integer number of seconds).
+   
+# How to add your config
+1) Make a copy of `src/config_object.py` and name it `trial_<whatever_you_want>.py`.
+The `.gitignore` will ignore it in the directory. 
+2) Change the fields that you need to. Add ones you need.
+    - You may need to implement new functionality that goes along with any new
+    fields.
+3) Determine what latency throughput files should match it (choose the range and
+step_size). See `config/lt.ini` for the default example.
+4) In `src/main.py`, add your new `trial_<whatever_you_want>.py` file with the
+filepath of the latency throughput file to the configuration section. Remember to
+import the config object files in `src/main.py`.
+5) Make sure the sqlite database directory is what you want it to be (by default,
+it is set to `/proj/cops-PG0/workspaces/jl87`).
+6) IMPORTANT: if any nodes have crashed, make sure to add their ip_enums as *args
+   in `enumerate_workload_nodes(...)` and `enumerate_warm_nodes(...)`. For example:
+   `enumerate_workload_nodes(driver_node_ip_enum, num_workload_nodes, 2, 5, 6)`
+   for node-1, node-4, and node-5.
+   Don't forget to repeat for `enumerate_warm_nodes(...)`.
+7) From the git root, run: `./src/main.py`
+
+### Need to Implement
+- Automatic start-up of chosen hotshard node.
+- Recording the exact cockroach commit in the copied parameter ini files instead of
+just the branch name, which may no longer exist at a later point in time.
+
+### Not Implemented
+- Partition affinity
@@ -0,0 +1,3 @@
+[DEFAULT]
+concurrency = [16, 56]
+step_size = 8
@@ -0,0 +1,3 @@
+[DEFAULT]
+concurrency = [32, 160]
+step_size = 8
@@ -0,0 +1,84 @@
+# Hotnode incorporation checklist
+1) Did you change the hotnode address (`node-X:50051`) in cockroachdb 
+   `pkg/server/server.go`?
+   
+2) Does that address match the one in your `trial_<config_object_name>.py`
+in `self.hot_node`?
+    
+3) Did you change the hotkey threshold to be what you want in CRDB
+`pkg/sql/conn_executor_prepare.go` in `isHotkey(key byte[])`?
+   
+4) Does that threshold match the one in `trial_<config_object_name>.py`
+in `self.hot_node_threshold`?
+
+# How to implement a new server-client test script on branch async_redo
+
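+1) Copy `src/async_config_object.py` and name the copy
+   `src/trial_<whatever_you_want>.py`. The `.gitignore` ignores files matching
+   `src/trial_*_*.py`, so make sure the name has an underscore after the
+   `trial_` prefix (e.g. `trial_async_test.py`).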
+   - Make sure you populate the fields under the `#default`
+    comment.
+   - Make sure all methods are correctly written,
+    especially the part on populating server and client nodes.
+     For example, are the nodes regioned? Does it matter?
+   - Make sure `generate_all_config_files()` method is implemented.
+   - Make sure the concurrency of the clients is always called 
+     "concurrency" (`self.concurrency` in `ConfigObject`)
+
+2) Change the fields you need to.
+
+3) Change `config/async_lt.ini` for latency-throughput.
+
+4) Implement to the interface of `src/async_server.py`.
+    - When implementing `aggregate_raw_logs()` function,
+    make sure to use the keys
+      - throughput: `"ops/sec(cum)"`
+      - p50: `"p50(ms)"`
+      - p99: `"p99(ms)"`
+    or the latency throughput graphs won't gnuplot at all
+   - Make sure gnuplot is installed (`apt install gnuplot-x11`)
+
+5) Whatever you name your implementation from the previous
+step, change the line `import async_server` in `src/async_main.py`
+   to `import <whatever_you_implemented> as async_server`
+    
+6) Configure/implement the swath of functions at the
+head of `src/async_main.py` to match your needs.
+   - Make sure the directory is correct. It's set to 
+    `thermopylae_tests/scratch/db_{datetime}` right now.
+     
+7) From `~/thermopylae_tests` directory, run `python3 src/async_main.py`
+   
+# How to implement new `async_determine_stable_interval.py` on branch async_redo
+1) Code to the interface of `src/async_server.py`
+2) Replace `import async_server` with `import <whatever_you_coded> as async_server`
+3) From `~/thermopylae_tests` dir, run `python3 src/async_determine_stable_interval.py
+   --duration 30 --csv_location scratch/stabilizer --graph_location scratch/stabilizer`
+   (`--duration` is an integer number of seconds).
+   
+# How to add your config
+1) Make a copy of `src/config_object.py` and name it `trial_<whatever_you_want>.py`.
+The `.gitignore` will ignore it in the directory. 
+2) Change the fields that you need to. Add ones you need.
+    - You may need to implement new functionality that goes along with any new
+    fields.
+3) Determine what latency throughput files should match it (choose the range and
+step_size). See `config/lt.ini` for the default example.
+4) In `src/main.py`, add your new `trial_<whatever_you_want>.py` file with the
+filepath of the latency throughput file to the configuration section. Remember to
+import the config object files in `src/main.py`.
+5) Make sure the sqlite database directory is what you want it to be (by default,
+it is set to `/proj/cops-PG0/workspaces/jl87`).
+6) IMPORTANT: if any nodes have crashed, make sure to add their ip_enums as *args
+   in `enumerate_workload_nodes(...)` and `enumerate_warm_nodes(...)`. For example:
+   `enumerate_workload_nodes(driver_node_ip_enum, num_workload_nodes, 2, 5, 6)`
+   for node-1, node-4, and node-5.
+   Don't forget to repeat for `enumerate_warm_nodes(...)`.
+7) From the git root, run: `./src/main.py`
+
+### Need to Implement
+- Automatic start-up of chosen hotshard node.
+- Recording the exact cockroach commit in the copied parameter ini files instead of
+just the branch name, which may no longer exist at a later point in time.
+
+### Not Implemented
+- Partition affinity
@@ -0,0 +1,88 @@
+import itertools
+
+import config_io
+import config_object as co
+import node
+
+
+class ConfigObject:
+
+    def __init__(self):
+
+        # default YOU MUST POPULATE THESE FIELDS
+        self.trials = [i for i in range(1)]
+        self.logs_dir = ["test"]
+        self.store_dir = ["async_server"]
+
+        # server
+        self.server_concurrency = [1]
+        self.server_commit_branch = ["async"]
+        self.server_node_ip_enum = [2]  # 196.168.1.???
+        # self.server_node = [some Node object]
+
+        # client
+        self.client_commit_branch = ["async"]
+        self.num_workload_nodes = [2]
+        self.concurrency = [10] # YOU MUST CALL CLIENT CONCURRENCY "CONCURRENCY"
+        self.driver_node_ip_enum = [i + 1 for i in self.server_node_ip_enum]  # 192.168.1.???
+        self.duration = [3]  # duration of trial in seconds
+        # self.workload_nodes [some Node objects]
+
+        # workload
+        self.batch = [1]  # keys per rpc
+        self.read_percent = [95]
+
+    def generate_config_combinations(self):
+        """Generates the trial configuration parameters for a single run,
+        lists all in a list of dicts.
+
+        :return: a list of dictionaries of combinations
+        """
+
+        temp_dict = vars(self)
+        all_field_values = list(temp_dict.values())
+        values_combinations = list(itertools.product(*all_field_values))
+
+        combinations = []
+        for combo in values_combinations:
+            config_dict = dict(zip(temp_dict.keys(), combo))
+            combinations.append(config_dict)
+
+        # populating node information. MAKE SURE THIS PART IS CORRECTLY WRITTEN
+        for config_dict in combinations:
+            driver_node_ip_enum = config_dict["driver_node_ip_enum"]
+            num_workload_nodes = config_dict["num_workload_nodes"]
+            workload_nodes, _ = co.ConfigObject.enumerate_workload_nodes(
+                driver_node_ip_enum, num_workload_nodes)
+            config_dict["workload_nodes"] = [vars(n) for n in workload_nodes]
+
+            server_node_ip_enum = config_dict["server_node_ip_enum"]
+            server_node = ConfigObject.create_server_node(server_node_ip_enum)
+            config_dict["server_node"] = vars(server_node)
+
+        return combinations
+
+    @staticmethod
+    def create_server_node(server_node_ip_enum):
+        return node.Node(server_node_ip_enum)
+
+    def generate_all_config_files(self):
+        """Generates all configuration files with different combinations of parameters.
+        :return:
+        """
+        ini_fpaths = []
+        config_combos = self.generate_config_combinations()
+        for config_dict in config_combos:
+            ini_fpath = co.ConfigObject.generate_ini_filename(suffix=config_dict["logs_dir"])
+            ini_fpaths.append(config_io.write_config_to_file(config_dict, ini_fpath))
+
+        return ini_fpaths
+
+
+def main():
+    config_object = ConfigObject()
+    print(config_object.generate_config_combinations())
+
+
+# Only print the combinations when this file is executed as a script.
+if __name__ == "__main__":
+    main()
@@ -0,0 +1,70 @@
+import argparse
+import os
+import sys
+
+import async_config_object
+import async_server
+
+# Config objects whose parameter combinations main() runs, in list order.
+CONFIG_OBJ_LIST = [
+    async_config_object.ConfigObject(),
+]
+
+
+def main():
+    parser = argparse.ArgumentParser(description="Determine a stable interval")
+    parser.add_argument("--duration", type=int, default=20 * 60,
+                        help="Duration (s) that to run test for")
+    parser.add_argument("--csv_location", type=str,
+                        default=os.path.join(os.getcwd(), "scratch/stabilizer"), 
+                        help="location of resulting csv file")
+    parser.add_argument("--graph_location", type=str,
+                        default=os.path.join(os.getcwd(), "scratch/stabilizer"),
+                        help="location of resulting graph")
+    args = parser.parse_args()
+
+    # Generate configurations
+    configs = []
+    for config_object in CONFIG_OBJ_LIST:
+        configs += config_object.generate_config_combinations()
+
+    # Run each configuration
+    for config in configs:
+
+        # clean up all experiments first
+        for node in config["workload_nodes"] + [config["server_node"]]:
+            async_server.kill(node)
+
+        # server
+        async_server.build_server(config["server_node"],
+                                  config["server_commit_branch"])
+        _ = async_server.run_server(config["server_node"],
+                                    config["server_concurrency"])
+
+        # clients
+        if not os.path.exists(args.csv_location):
+            os.mkdir(args.csv_location)
+        for client in config["workload_nodes"]:
+            async_server.build_client(client, config["server_commit_branch"])
+        logfiles = async_server.run_clients(config["workload_nodes"],
+                                            config["server_node"],
+                                            args.duration,
+                                            config["concurrency"],
+                                            config["batch"],
+                                            config["read_percent"],
+                                            args.csv_location)
+
+        # graph
+        dat_file = async_server.parse_raw_logfiles(logfiles, args.csv_location)
+        if not os.path.exists(args.graph_location):
+            os.mkdir(args.graph_location)
+        async_server.graph(dat_file, args.graph_location)
+
+        # clean up again
+        for node in config["workload_nodes"] + [config["server_node"]]:
+            async_server.kill(node)
+
+    return 0
+
+
+# Run as a script: main()'s return value becomes the process exit status.
+if __name__ == "__main__":
+    sys.exit(main())
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+[DEFAULT]`
	`2`	`+concurrency = [16, 56]`
	`3`	`+step_size = 8`
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+[DEFAULT]`
	`2`	`+concurrency = [32, 160]`
	`3`	`+step_size = 8`