From 6c4739f2811aec67b3c3fa93a21f55bc8711f92c Mon Sep 17 00:00:00 2001
From: KylerAce <kylerlumpkin1@gmail.com>
Date: Sun, 26 Dec 2021 21:43:10 -0800
Subject: [PATCH 1/5] creates stats and graphing for the sendmaps profiler logs

---
 Update.bat                |   3 +-
 root/MaptickAverager.py   | 129 +++++++++++++++++++++++++++++++++++++-
 root/RawLogsScraper.py    |  10 ++-
 root/SingleRound.py       |   4 +-
 root/maptick_plot.gnuplot |  52 ++++++++++-----
 5 files changed, 175 insertions(+), 23 deletions(-)

diff --git a/Update.bat b/Update.bat
index 0257bd2..b3c8e9c 100644
--- a/Update.bat
+++ b/Update.bat
@@ -9,4 +9,5 @@ echo Averaging CSV files
 py MaptickAverager.py
 echo Plotting Graphs
 gnuplot maptick_plot.gnuplot
-popd "%~dp0"
\ No newline at end of file
+popd "%~dp0"
+pause
\ No newline at end of file
diff --git a/root/MaptickAverager.py b/root/MaptickAverager.py
index 060e68d..670af7c 100644
--- a/root/MaptickAverager.py
+++ b/root/MaptickAverager.py
@@ -15,6 +15,10 @@
 data_file = "data/last_run.dat"
 old_data_file = f"{output_loc}last_run.dat"
 
+#converts a float input measured in seconds to one in microseconds
+def to_microseconds(value):
+    return value * 1000 * 1000
+
 #Converts a log file into a dict
 def log_file_to_dict():
     write_to = {}
@@ -207,7 +211,7 @@ def add_new_value(list, new_value, value_creator):
 highpass = 2.5 #Cuts out the pain stuff while still allowing the carpet bump to remain clear
 data_log["highpass_threshold"] = highpass
 
-keys_to_average = ["maptick_to_player", "maptick", "players", "td", "td_to_player"]
+keys_to_average = ["maptick_to_player", "maptick", "players", "td", "td_to_player", "sendmaps_cost_per_tick", "per_client", "look_for_movable_changes", "check_turf_vis_conts", "check_hud/image_vis_contents", "turfs_in_range", "obj_changes", "mob_changes", "movables_examined"]
 
 input = glob.glob("output/*.csv")
 
@@ -233,7 +237,8 @@ def add_new_value(list, new_value, value_creator):
 maps_we_care_about = ["Delta%20Station", "Ice%20Box%20Station", "Kilo%20Station", "MetaStation", "Tramstation"]
 
 data = {} #Dictionary of file names to dictionaries of data to be written later.
- 
+
+# first pass of data parsing: populate the data dictionary with info
 # for all round ids we've not ingested before
 for index in range(id_start_at, len(input)):
     f_name = input[index]
@@ -242,6 +247,34 @@ def add_new_value(list, new_value, value_creator):
     player_total = 0
     td_total = 0
 
+    sendmaps_total_cost = 0 #all of these only use the last rows data which is the real total for that round
+    sendmaps_total_calls = 0
+
+    sendmaps_client_cost = 0
+    sendmaps_client_calls = 0
+
+    movable_changes_cost = 0
+    movable_changes_calls = 0
+
+    check_turf_vis_contents_cost = 0
+    check_turf_vis_contents_calls = 0
+
+    check_hud_image_vis_contents_cost = 0
+    check_hud_image_vis_contents_calls = 0
+
+    loop_turfs_in_range_cost = 0
+    loop_turfs_in_range_calls = 0
+
+    obj_changes_cost = 0
+    obj_changes_calls = 0
+
+    mob_changes_cost = 0
+    mob_changes_calls = 0
+
+    movables_examined = 0
+
+    has_sendmaps_profiler_logs = False
+
     csvfile = open(f_name, newline='')
     reader = csv.DictReader(csvfile)
     #read all the data 
@@ -250,6 +283,35 @@ def add_new_value(list, new_value, value_creator):
         maptick_total += float(row["maptick"])
         player_total += float(row["players"])
         td_total += float(row["tidi_avg"]) 
+
+        sendmaps_total_cost = float(row.get("send_maps") or 0)#the last row read is the final value for these
+        sendmaps_total_calls = float(row.get("send_maps_count") or 0)#have to use .get(index) or 0 because not all logs have these indices
+        if sendmaps_total_cost != 0.0:
+            has_sendmaps_profiler_logs = True
+
+        sendmaps_client_cost = float(row.get("per_client") or 0)
+        sendmaps_client_calls = float(row.get("per_client_count") or 0)
+
+        movable_changes_cost = float(row.get("look_for_movable_changes") or 0)
+        movable_changes_calls = float(row.get("look_for_movable_changes_count") or 0)
+
+        check_turf_vis_contents_cost = float(row.get("check_turf_vis_conts") or 0)
+        check_turf_vis_contents_calls = float(row.get("check_turf_vis_conts_count") or 0)
+
+        check_hud_image_vis_contents_cost = float(row.get("check_hud/image_vis_contents") or 0)
+        check_hud_image_vis_contents_calls = float(row.get("check_hud/image_vis_contents_count") or 0)
+
+        loop_turfs_in_range_cost = float(row.get("turfs_in_range") or 0)
+        loop_turfs_in_range_calls = float(row.get("turfs_in_range_count") or 0)
+
+        obj_changes_cost = float(row.get("obj_changes") or 0)
+        obj_changes_calls = float(row.get("obj_changes_count") or 0)
+
+        mob_changes_cost = float(row.get("mob_changes") or 0)
+        mob_changes_calls = float(row.get("mob_changes_count") or 0)
+
+        movables_examined = float(row.get("movables_examined") or 0)
+
     csvfile.close()
 
     #In the template perf-[roundid]-[mapname]-[servername].csv
@@ -277,6 +339,55 @@ def add_new_value(list, new_value, value_creator):
     avg_maptick = 0
     avg_players = 0
     avg_td = 0
+
+    sendmaps_cost_per_tick = 0 #absolute cost values: either milliseconds, microseconds, or total movables examined
+    sendmaps_clients = 0
+    avg_cost_per_client = 0
+    avg_cost_movable_changes = 0
+    avg_cost_turf_vis_contents = 0
+    avg_cost_hud_image_vis_contents = 0
+    avg_cost_turfs_in_range = 0
+    avg_cost_obj_changes = 0
+    avg_cost_mob_changes = 0
+    avg_movables_examined = 0
+
+    look_for_movable_changes_percent = 0 #relative cost percentage values: percentage of sendmaps total cost
+    turf_vis_contents_percent = 0
+    hud_image_vis_contents_percent = 0
+    loop_turfs_in_range_percent = 0
+    send_obj_changes_percent = 0
+    send_mob_changes_percent = 0
+
+    if has_sendmaps_profiler_logs:
+        #the cost vars are always in seconds which makes most of them very small. converting to microseconds is much better
+        sendmaps_cost_per_tick = to_microseconds(sendmaps_total_cost / sendmaps_total_calls)
+        sendmaps_clients = sendmaps_client_calls / sendmaps_total_calls 
+
+        if sendmaps_client_calls:
+            avg_cost_per_client = to_microseconds(sendmaps_total_cost / sendmaps_client_calls)
+        if movable_changes_calls:
+            avg_cost_movable_changes = to_microseconds(movable_changes_cost / movable_changes_calls)
+        if check_turf_vis_contents_calls:
+            avg_cost_turf_vis_contents = to_microseconds(check_turf_vis_contents_cost / check_turf_vis_contents_calls)
+        if check_hud_image_vis_contents_calls:
+            avg_cost_hud_image_vis_contents = to_microseconds(check_hud_image_vis_contents_cost / check_hud_image_vis_contents_calls)
+        if loop_turfs_in_range_calls:
+            avg_cost_turfs_in_range = to_microseconds(loop_turfs_in_range_cost / loop_turfs_in_range_calls)
+        if obj_changes_calls:
+            avg_cost_obj_changes = to_microseconds(obj_changes_cost / obj_changes_calls)
+        if mob_changes_calls:
+            avg_cost_mob_changes = to_microseconds(mob_changes_cost / mob_changes_calls)
+        if sendmaps_client_calls:
+            avg_movables_examined = movables_examined / sendmaps_client_calls
+
+        if sendmaps_total_cost:
+            look_for_movable_changes_percent = 100 * movable_changes_cost / sendmaps_total_cost
+            turf_vis_contents_percent = 100 * check_turf_vis_contents_cost / sendmaps_total_cost
+            hud_image_vis_contents_percent = 100 * check_hud_image_vis_contents_cost / sendmaps_total_cost
+            loop_turfs_in_range_percent = 100 * loop_turfs_in_range_cost / sendmaps_total_cost
+            send_obj_changes_percent = 100 * obj_changes_cost / sendmaps_total_cost
+            send_mob_changes_percent = 100 * mob_changes_cost / sendmaps_total_cost
+
     if player_total:
         maptick_by_players = maptick_total / player_total
         td_by_players = td_total / player_total
@@ -285,7 +396,7 @@ def add_new_value(list, new_value, value_creator):
         avg_players = player_total / lines_read
         avg_td = td_total / lines_read
 
-    #I'm sorry
+    #finalize our data collection by map, server, and generic single stat files
     pending = [map, server, "maptick", "highpass_maptick"]
     for index in pending:
         if index not in data: #If one doesn't already exist, make a new list to put our map data into
@@ -299,9 +410,21 @@ def add_new_value(list, new_value, value_creator):
         to_write["maptick"] = avg_maptick
         to_write["players"] = avg_players 
         to_write["td"] = avg_td
+
         if td_by_players > 1.2:
             td_by_players = 0.6
         to_write["td_to_player"] = td_by_players
+
+        to_write["sendmaps_cost_per_tick"] = sendmaps_cost_per_tick
+        to_write["per_client"] = avg_cost_per_client
+        to_write["look_for_movable_changes"] = avg_cost_movable_changes
+        to_write["check_turf_vis_conts"] = avg_cost_turf_vis_contents
+        to_write["check_hud/image_vis_contents"] = avg_cost_hud_image_vis_contents
+        to_write["turfs_in_range"] = avg_cost_turfs_in_range
+        to_write["obj_changes"] = avg_cost_obj_changes
+        to_write["mob_changes"] = avg_cost_mob_changes
+        to_write["movables_examined"] = avg_movables_examined
+
         data[index].append(to_write)
 
     print(f"Read [{id}] [{map}] [{server}]")
diff --git a/root/RawLogsScraper.py b/root/RawLogsScraper.py
index 7a61e08..2ee8cdd 100644
--- a/root/RawLogsScraper.py
+++ b/root/RawLogsScraper.py
@@ -95,6 +95,7 @@ def __init__(self, expression, message):
 class Buffer:
 
     def __init__(self, size, server, lastUrl = ""):
+        #how many files we can hold in our buffer before we have to write them all to data buffers
         self.size = size
         # List of [url, fileName, text]s
         self.fileBuffer = []
@@ -103,6 +104,7 @@ def __init__(self, size, server, lastUrl = ""):
         # Our last saved url
         self.previousUrl = lastUrl
 
+    #write every data file we have in our buffer to a data file in the output folder
     def dumpBuffer(self):
         if len(self.fileBuffer) == 0:
             return
@@ -127,6 +129,7 @@ def writeToBuffer(self, url, fileName, text):
             return
         self.dumpBuffer()
 
+#writes to the lastrun.dat file to store info on the current scraping run
 def writeDataFile(server, roundUrl, previousUrl):
     master_info = scraped_info
     
@@ -168,6 +171,7 @@ def clearDataFile():
 #fakingIdentity = json.load(do_not_post_this_4head) #Loads a .json file containing the cookie and other params to send to mso
 #do_not_post_this_4head.close()
 
+#return the file located at the given url if possible
 def get_url(requestTarget) :
     for i in range(1, retry_limit):
         response = requests.get(requestTarget, headers = fakingIdentity)
@@ -236,7 +240,7 @@ def listFD(url):
     #return [node.get('href') for node in soup.find_all('a')]
 
 def readFile(url, name, serverName, fileBuffer):
-    response = get_url(url)
+    targeted_file = get_url(url)
     name = name.rstrip('.gz')
     name_parts = name.split(".")
     name_parts[0] += f"-{serverName}"
@@ -244,13 +248,13 @@ def readFile(url, name, serverName, fileBuffer):
     filename = outputFolder + name
 
     #The exists check prevents overscanning, if you fuck something up comment it out 
-    if not response: 
+    if not targeted_file: 
         return -1
     
     if os.path.exists(filename):
         return -1
     
-    fileBuffer.writeToBuffer(url, filename, response.text)
+    fileBuffer.writeToBuffer(url, filename, targeted_file.text)
 
 def roundAge(round):
     # If you're not a string (Not a round id) I'm not interested
diff --git a/root/SingleRound.py b/root/SingleRound.py
index 695c153..a9da736 100644
--- a/root/SingleRound.py
+++ b/root/SingleRound.py
@@ -11,7 +11,7 @@
 output_to = "single_round/temporary"
 read_from = "output/"
 sendmaps_starting = ["send_maps", "initial_house", "cleanup", "client_loop", "per_client", "deleted_images", "hud_update", "statpanel_update", "map_data", "check_eye_pos", "update_chunks", "turfmap_updates", "changed_turfs", "turf_chunk_info", "obj_changes", "mob_changes", "send_turf_vis_conts", "pending_animations", "look_for_movable_changes", "check_turf_vis_conts", "check_hud/image_vis_contents", "turfs_in_range", "movables_examined"]
-sendmaps_grunge = []
+sendmaps_grunge = []#like above but everything ends in _count. theyre just # of calls for that thing
 for name in sendmaps_starting:
     sendmaps_grunge += [name + "_count"]
 
@@ -36,7 +36,7 @@
 reader = csv.DictReader(csvfile)
 
 output = open(f"{output_to}.csv", 'w')
-writer = csv.DictWriter(output, fieldnames=fieldnames+sendmaps_grunge+sendmaps_starting)
+writer = csv.DictWriter(output, fieldnames=fieldnames + sendmaps_grunge + sendmaps_starting)
 writer.writeheader()
 
 for row in reader:
diff --git a/root/maptick_plot.gnuplot b/root/maptick_plot.gnuplot
index cb233c2..4b5caf8 100644
--- a/root/maptick_plot.gnuplot
+++ b/root/maptick_plot.gnuplot
@@ -28,6 +28,13 @@ outputfile10 = sprintf("%s Average By Map%s", filename, outputformat)
 outputfile11 = sprintf("%s Average By Server%s", filename, outputformat)
 outputfile12 = sprintf("%s%s", filename, outputformat)
 
+filename = "SendMaps Profiler"
+filename = sprintf("%s%s", outputfolder, filename)
+outputfile13 = sprintf("%s Average%s", filename, outputformat)
+outputfile14 = sprintf("%s Average By Map%s", filename, outputformat)
+outputfile15 = sprintf("%s Average By Server%s", filename, outputformat)
+#outputfile16 = sprintf("%s Average%s", filename, outputformat)
+
 set key autotitle columnheader 
 set key noenhanced
 set term png size 1000, 600 
@@ -41,11 +48,12 @@ set yrange [0:]
 set grid ytics
 
 #CSV file is formatted like this
-# id, maptick_to_player, maptick, players, td, td_to_player
-# followed by three entries for everything but the id. avg, min, and max
+# id, maptick_to_player, maptick, players, td, td_to_player, sendmaps_cost_per_tick, per_client, look_for_movable_changes, check_turf_vis_conts, check_hud/image_vis_contents, turfs_in_range, obj_changes, mob_changes, movables_examined
+# followed by three entries for everything but the id: the avg, the min, and the max
 
 #To find the index of the header you want, use this forumula
-# 6 + ((spot in list - 2) * 3) + (spot in list - 1) * header you want
+# 15 + ((spot in list - 2) * 3) + (spot in list - 1) * header you want
+#I HAVE NO IDEA HOW THESE ARE DERIVED REEEEEEEEEEEEEE
 
 highpass = "highpass_maptick.csv"
 highpass = sprintf("%s%s", inputfolder, highpass)
@@ -53,12 +61,12 @@ highpass = sprintf("%s%s", inputfolder, highpass)
 set rmargin 13
 set output outputfile1
 set title "MPP (High Pass Filter)"
-plot highpass using 1:2 with lines title "Maptick Per Player"
+plot highpass using 1:7 with lines title "Maptick Per Player"
 
 set rmargin 13
 set output outputfile2
 set title "MPP"
-plot inputfile using 1:2 with lines title "Maptick Per Player"
+plot inputfile using 1:7 with lines title "Maptick Per Player"
 
 set rmargin 22
 set output outputfile3
@@ -72,40 +80,56 @@ serverfiles = "manuel.csv basil.csv sybil.csv terry.csv"
 
 set output outputfile4
 set title "Average Maptick Over Player Count By Map"
-plot for [file in mapfiles] sprintf("%s%s", inputfolder, file) using 1:7 with lines title file 
+plot for [file in mapfiles] sprintf("%s%s", inputfolder, file) using 1:16 with lines title file 
 
 set output outputfile5
 set title "Average Maptick Over Player Count By Server"
-plot for [file in serverfiles] sprintf("%s%s", inputfolder, file) using 1:7 with lines title file 
+plot for [file in serverfiles] sprintf("%s%s", inputfolder, file) using 1:16 with lines title file 
 
 set ylabel 'Player Count'
 
 set output outputfile6
 set title "Average Player Count"
-plot inputfile using 1:15 with lines
+plot inputfile using 1:22 with lines
 
 set output outputfile7
 set title "Average Player Count By Map"
-plot for [file in mapfiles] sprintf("%s%s", inputfolder, file) using 1:15 with lines title file
+plot for [file in mapfiles] sprintf("%s%s", inputfolder, file) using 1:22 with lines title file
 
 set output outputfile8
 set title "Average Player Count By Server"
-plot for [file in serverfiles] sprintf("%s%s", inputfolder, file) using 1:15 with lines title file
+plot for [file in serverfiles] sprintf("%s%s", inputfolder, file) using 1:22 with lines title file
 
 set ylabel 'TD'
 
 set output outputfile9
 set title "Average TD"
-plot inputfile using 1:16 with lines
+plot inputfile using 1:25 with lines
 
 set output outputfile10
 set title "Average TD By Map"
-plot for [file in mapfiles] sprintf("%s%s", inputfolder, file) using 1:16 with lines title file
+plot for [file in mapfiles] sprintf("%s%s", inputfolder, file) using 1:25 with lines title file
 
 set output outputfile11
 set title "Average TD By Server"
-plot for [file in serverfiles] sprintf("%s%s", inputfolder, file) using 1:16 with lines title file
+plot for [file in serverfiles] sprintf("%s%s", inputfolder, file) using 1:25 with lines title file
 
 set output outputfile12
 set title "TD"
-plot inputfile using 1:5 with lines title "TD"
\ No newline at end of file
+plot inputfile using 1:5 with lines title "TD"
+
+set ylabel 'Microseconds'
+
+set output outputfile13
+set title "Average Costs"
+plot inputfile using 1:34 with lines, '' using 1:37 with lines, '' using 1:40 with lines, '' using 1:43 with lines, '' using 1:46 with lines, '' using 1:49 with lines, '' using 1:52 with lines, '' using 1:55 with lines
+
+set ylabel "Count"
+
+set output outputfile14
+set title "Movable Count By Map"
+plot for [file in mapfiles] sprintf("%s%s", inputfolder, file) using 1:55 with lines title file
+
+set output outputfile15
+set title "Movable Count By Server"
+plot for [file in serverfiles] sprintf("%s%s", inputfolder, file) using 1:55 with lines title file
\ No newline at end of file

From c5d6080aa707b1cd3f3dec87c07b9562c7bf8a70 Mon Sep 17 00:00:00 2001
From: KylerAce <kylerlumpkin1@gmail.com>
Date: Sun, 26 Dec 2021 22:06:51 -0800
Subject: [PATCH 2/5] defines a sane x range for the profiler graphs and
 removes unused stats

---
 root/MaptickAverager.py   | 15 ---------------
 root/maptick_plot.gnuplot |  3 ++-
 2 files changed, 2 insertions(+), 16 deletions(-)

diff --git a/root/MaptickAverager.py b/root/MaptickAverager.py
index 670af7c..9a97464 100644
--- a/root/MaptickAverager.py
+++ b/root/MaptickAverager.py
@@ -351,13 +351,6 @@ def add_new_value(list, new_value, value_creator):
     avg_cost_mob_changes = 0
     avg_movables_examined = 0
 
-    look_for_movable_changes_percent = 0 #relative cost percentage values: percentage of sendmaps total cost
-    turf_vis_contents_percent = 0
-    hud_image_vis_contents_percent = 0
-    loop_turfs_in_range_percent = 0
-    send_obj_changes_percent = 0
-    send_mob_changes_percent = 0
-
     if has_sendmaps_profiler_logs:
         #the cost vars are always in seconds which makes most of them very small. converting to microseconds is much better
         sendmaps_cost_per_tick = to_microseconds(sendmaps_total_cost / sendmaps_total_calls)
@@ -380,14 +373,6 @@ def add_new_value(list, new_value, value_creator):
         if sendmaps_client_calls:
             avg_movables_examined = movables_examined / sendmaps_client_calls
 
-        if sendmaps_total_cost:
-            look_for_movable_changes_percent = 100 * movable_changes_cost / sendmaps_total_cost
-            turf_vis_contents_percent = 100 * check_turf_vis_contents_cost / sendmaps_total_cost
-            hud_image_vis_contents_percent = 100 * check_hud_image_vis_contents_cost / sendmaps_total_cost
-            loop_turfs_in_range_percent = 100 * loop_turfs_in_range_cost / sendmaps_total_cost
-            send_obj_changes_percent = 100 * obj_changes_cost / sendmaps_total_cost
-            send_mob_changes_percent = 100 * mob_changes_cost / sendmaps_total_cost
-
     if player_total:
         maptick_by_players = maptick_total / player_total
         td_by_players = td_total / player_total
diff --git a/root/maptick_plot.gnuplot b/root/maptick_plot.gnuplot
index 4b5caf8..73ab819 100644
--- a/root/maptick_plot.gnuplot
+++ b/root/maptick_plot.gnuplot
@@ -119,10 +119,11 @@ set title "TD"
 plot inputfile using 1:5 with lines title "TD"
 
 set ylabel 'Microseconds'
+set xrange [163000:]
 
 set output outputfile13
 set title "Average Costs"
-plot inputfile using 1:34 with lines, '' using 1:37 with lines, '' using 1:40 with lines, '' using 1:43 with lines, '' using 1:46 with lines, '' using 1:49 with lines, '' using 1:52 with lines, '' using 1:55 with lines
+plot inputfile using 1:34 with lines, '' using 1:37 with lines, '' using 1:40 with lines, '' using 1:43 with lines, '' using 1:46 with lines, '' using 1:49 with lines, '' using 1:52 with lines#, '' using 1:55 with lines
 
 set ylabel "Count"
 

From 2d68ca94bcf8d026d7551372c88eb68cefc1923c Mon Sep 17 00:00:00 2001
From: KylerAce <kylerlumpkin1@gmail.com>
Date: Thu, 18 Aug 2022 20:11:48 -0700
Subject: [PATCH 3/5] creates TrackStat class to help easily define new stats

---
 root/MaptickAverager.py   | 421 ++++++++++++++++++++++++++------------
 root/SingleRound.py       |   4 -
 root/maptick_plot.gnuplot |   1 -
 3 files changed, 291 insertions(+), 135 deletions(-)

diff --git a/root/MaptickAverager.py b/root/MaptickAverager.py
index 9a97464..83f5dda 100644
--- a/root/MaptickAverager.py
+++ b/root/MaptickAverager.py
@@ -3,6 +3,8 @@
 import os
 import os.path
 import sys
+import enum
+from enum import auto
 
 MAX = sys.float_info.max
 
@@ -15,11 +17,15 @@
 data_file = "data/last_run.dat"
 old_data_file = f"{output_loc}last_run.dat"
 
-#converts a float input measured in seconds to one in microseconds
+# converts a float input measured in seconds to one in microseconds
+
+
 def to_microseconds(value):
     return value * 1000 * 1000
 
-#Converts a log file into a dict
+# Converts a log file into a dict
+
+
 def log_file_to_dict():
     write_to = {}
     file_path = data_file
@@ -28,43 +34,47 @@ def log_file_to_dict():
         file_path = old_data_file
         if not os.path.exists(file_path):
             return write_to
-    
-    #A data file holding info about the last "compile"
-    #In the format Key:Data\n
-    info_file = open(file_path, 'r') 
+
+    # A data file holding info about the last "compile"
+    # In the format Key:Data\n
+    info_file = open(file_path, 'r')
     info = info_file.read()
     info_file.close()
 
-    info = info.split("\n") #Split the file into lines
+    info = info.split("\n")  # Split the file into lines
     for line in info:
-        packet = line.split(":") #Convert the file into a dict
-        if not line: #Damn new lines
+        packet = line.split(":")  # Convert the file into a dict
+        if not line:  # Damn new lines
             continue
         write_to[packet[0]] = str(packet[1])
-    
+
     return write_to
 
-#Converts a log file into a dict, in the format described above
+# Converts a log file into a dict, in the format described above
+
+
 def dict_to_log_file(dict):
     write_string = ""
     file_path = data_file
-    
+
     for key in dict:
         write_string += f"{key}:{dict[key]}\n"
-    
+
     write_string.strip("\n")
 
-    info_file = open(file_path, 'w') 
+    info_file = open(file_path, 'w')
     info_file.write(write_string)
     info_file.close()
 
-#Returns true if the two dicts match in terms of method, false otherwise
+# Returns true if the two dicts match in terms of method, false otherwise
+
+
 def compare_dict_methods(dict1, dict2, compare_by):
     for entry in compare_by:
         if entry not in dict1 and entry not in dict2:
             print(f"{entry} was in nothing, wtf")
             continue
-        #One file is newer then the other, do a full rerun
+        # One file is newer then the other, do a full rerun
         if entry not in dict1 or entry not in dict2:
             print(f"The dat file was outdated")
             return False
@@ -73,73 +83,82 @@ def compare_dict_methods(dict1, dict2, compare_by):
             return False
     return True
 
+
 def copy_dict_into_dict(copy_from, copy_into, keys_to_ignore):
     for key in copy_from:
         if key in keys_to_ignore:
             continue
         copy_into[key] = copy_from[key]
 
-#Modified binary search. check_function returns 1 if the first index is "larger" then the second, -1 if it's smaller, and 0 if they're the same
+# Modified binary search. check_function returns 1 if the first index is "larger" then the second, -1 if it's smaller, and 0 if they're the same
+
+
 def round_binary_search(arr, look_for):
     look_for = int(look_for)
     low = 0
     high = len(arr) - 1
     mid = 0
- 
+
     while low <= high:
- 
+
         mid = (high + low) // 2
 
-        properties = arr[mid].split("-") #This will get messy if you have a - in the system path
-        working_rnd_id = int(properties[1]) #Hopefully the  second line in this file is always the round's id
+        # This will get messy if you have a - in the system path
+        properties = arr[mid].split("-")
+        # Hopefully the  second line in this file is always the round's id
+        working_rnd_id = int(properties[1])
         if working_rnd_id < look_for:
             low = mid + 1
         elif working_rnd_id > look_for:
             high = mid - 1
         else:
             return mid
- 
+
     # If we reach here, then the element was not present
     return -1
 
+
 def file_binary_search(arr, look_for):
     look_for = int(look_for)
     low = 0
     high = len(arr) - 1
     mid = 0
- 
+
     while low <= high:
- 
+
         mid = (high + low) // 2
 
-        properties = arr[mid].split(",") #This will get messy if you have a - in the system path
-        working_rnd_id = int(properties[0]) #First line's always the id, right? RIGHT?
+        # This will get messy if you have a - in the system path
+        properties = arr[mid].split(",")
+        # First line's always the id, right? RIGHT?
+        working_rnd_id = int(properties[0])
         if working_rnd_id < look_for:
             low = mid + 1
         elif working_rnd_id > look_for:
             high = mid - 1
         else:
             return mid
-    
+
     if mid <= 0:
-        return mid #This is for the empty files, since you can't take away more then nothing can you
+        return mid  # This is for the empty files, since you can't take away more then nothing can you
 
     roundid = int(arr[mid].split(",")[0])
     lastmid = mid
-    #While we're greater then the target round id
+    # While we're greater then the target round id
     while roundid >= look_for:
-        if mid - 1 <= -1: #If this is the last item in the list give up
-            break    
-        lastmid = mid #Set lastmid to our current value
-        mid -= 1 #Lower mid by one
-        roundid = int(arr[mid].split(",")[0]) #Set roundid to the new value
-
-    #This will keep looping until we either hit the end, or go below the last round id
-    #Should prevent rounding issues with the binary search
- 
+        if mid - 1 <= -1:  # If this is the last item in the list give up
+            break
+        lastmid = mid  # Set lastmid to our current value
+        mid -= 1  # Lower mid by one
+        roundid = int(arr[mid].split(",")[0])  # Set roundid to the new value
+
+    # This will keep looping until we either hit the end, or go below the last round id
+    # Should prevent rounding issues with the binary search
+
     # If we reach here, then the element was not present
     return lastmid
 
+
 def make_list_into_string(headers):
     output = ""
     for header in headers:
@@ -148,6 +167,7 @@ def make_list_into_string(headers):
     output += "\n"
     return output
 
+
 def turn_dict_into_comma_seperated_string(dict_to_convert, headers):
     output = ""
     for key in headers:
@@ -156,10 +176,11 @@ def turn_dict_into_comma_seperated_string(dict_to_convert, headers):
     output += "\n"
     return output
 
+
 def recalculate_value(list, default_value, value_creator):
     current_val = list[0]
     first = list[1][0]
-    list[1].pop(0) #Remove the first item in the list
+    list[1].pop(0)  # Remove the first item in the list
     if first == current_val:
         holder = default_value
         for value in list[1]:
@@ -168,27 +189,29 @@ def recalculate_value(list, default_value, value_creator):
             holder = 0
         list[0] = holder
 
+
 def add_new_value(list, new_value, value_creator):
     list[0] = value_creator(new_value, list[0])
     list[1] += [new_value]
 
-#A dict of information about this run, used to determin if a full run is needed next time
+
+# A dict of information about this run, used to determin if a full run is needed next time
 data_log = {}
 
-tags_to_compare_with = ["backward_avg", "forward_avg", "backward_bound", "forward_bound", "starting_at", "highpass_threshold"]
+tags_to_compare_with = ["backward_avg", "forward_avg", "backward_bound","forward_bound", "starting_at", "highpass_threshold"]
 tags_to_leave_pure = tags_to_compare_with + ["last_round_fully_processed"]
-#A dict of information about the last run we did
+# A dict of information about the last run we did
 old_log = log_file_to_dict()
 
-#Modify these tochange the size of the moving average
-movingbackward = 50
-movingforward = 50
+# Modify these tochange the size of the moving average
+movingbackward = 30
+movingforward = 30
 total_moving_space = movingbackward + movingforward
 
 data_log["backward_avg"] = str(movingbackward)
 data_log["forward_avg"] = str(movingforward)
 
-#Modify these to effect the size of moving minimums and maximums. so how large should our bucket of items to min/max be basically
+# Modify these to effect the size of moving minimums and maximums. so how large should our bucket of items to min/max be basically
 boundbackward = 20
 boundforward = 20
 total_bound = boundbackward + boundforward
@@ -196,28 +219,29 @@ def add_new_value(list, new_value, value_creator):
 data_log["backward_bound"] = str(boundbackward)
 data_log["forward_bound"] = str(boundforward)
 
-#Knock on wood
+# Knock on wood
 data_log["last_round_fully_processed"] = 10000000000
 
-#A reminder of the farthest back you can go
+# A reminder of the farthest back you can go
 ON_THE_MORNING_OF_THE_FIRST_DAY = 150043
-#This is useful for making graphs that scale a little bit better, fucking carpets man
+# This is useful for making graphs that scale a little bit better, fucking carpets man
 PAST_CARPETS = 156000
 
-#What round id to start reading at
+# What round id to start reading at
 head_rnd = ON_THE_MORNING_OF_THE_FIRST_DAY
 data_log["starting_at"] = head_rnd
 
-highpass = 2.5 #Cuts out the pain stuff while still allowing the carpet bump to remain clear
+highpass = 2.5  # Cuts out the pain stuff while still allowing the carpet bump to remain clear
 data_log["highpass_threshold"] = highpass
 
 keys_to_average = ["maptick_to_player", "maptick", "players", "td", "td_to_player", "sendmaps_cost_per_tick", "per_client", "look_for_movable_changes", "check_turf_vis_conts", "check_hud/image_vis_contents", "turfs_in_range", "obj_changes", "mob_changes", "movables_examined"]
 
 input = glob.glob("output/*.csv")
 
-#The index to start reading at
+# The index to start reading at
 id_start_at = round_binary_search(input, head_rnd)
-preserve_old_files = compare_dict_methods(data_log, old_log, tags_to_compare_with)
+preserve_old_files = compare_dict_methods(
+    data_log, old_log, tags_to_compare_with)
 
 if preserve_old_files:
     round_start_at = old_log["last_round_fully_processed"]
@@ -229,14 +253,113 @@ def add_new_value(list, new_value, value_creator):
 for key in keys_to_average:
     fieldnames += [f"avg_{key}"]
     fieldnames += [f"min_{key}"]
-    fieldnames += [f"max_{key}"]  
+    fieldnames += [f"max_{key}"]
 
 fieldnames = ["id"] + fieldnames
 
-#I despise janitors 
-maps_we_care_about = ["Delta%20Station", "Ice%20Box%20Station", "Kilo%20Station", "MetaStation", "Tramstation"]
+# I despise janitors
+maps_we_care_about = ["Delta%20Station", "Ice%20Box%20Station",
+                      "Kilo%20Station", "MetaStation", "Tramstation"]
+
+# Dictionary of file names to dictionaries of data to be written later.
+data = {}
+
+# most processed stats are averages of two values, this just makes it easier to define
+
+
+def PROCESSED_STAT_AVERAGE(numerator, denominator, scaling_func): return [
+    numerator, denominator, scaling_func] if scaling_func else [numerator, denominator]
+
+# scaling_func = additional function to call on the fraction to scale it before returning
+
+
+def avg(numerator, denominator, scaling_func=to_microseconds):
+    if(denominator > 0):
+        return scaling_func(numerator / denominator)
+    else:
+        return 0
+
+class StatToken(enum.Enum):
+    USE_PREVIOUS_SIMPLE_STAGE = auto()
+    SELF = auto()
+
+# holder for data used to determine what stats to grab from the raw files and what to do with that data afterwards.
+# these dont actually do work themselves, they're just a helpful way to define a pipeline of raw data to processed statistics.
+# the actual work is done via lists / dictionaries created to hold the stats defined in instances of this class (and subtypes)
+class TrackedStat:
+    name = ""
 
-data = {} #Dictionary of file names to dictionaries of data to be written later.
+    # FIRST STAGE STATS (reading directly from rows, all defined stats at this stage go into first_stage_stats)
+
+    # the names of the stats we read from each row, each of these will be added to a cumulative value
+    # list of the form: [string exactly matching a stat grabbed from the row]
+    cumulative_raw_stats = []
+
+    # like cumulative_raw_stats, but they arent just added to with the value from each row, you can define how the stored value is changed with each read pass
+    # dictionary of the form: {string exactly matching a stat grabbed from the row : function reference to call each pass}
+    # you probably dont need this, it slows down reading
+    special_raw_stats = {}
+
+    # SECOND STAGE STATS (iterating over first stage stats, all defined stats at this stage go into second_stage_stats)
+
+    # stats that are averaged from two first stage stats
+    # dictionary of the form: {processed stat name (string) : [numerator stat read from rows, denominator stat read from rows, scaling function if not to_microseconds]}
+    # most second stage stats go in here
+    averaged_stats = {}
+
+    # like averaged_stats except you can define other functions to use
+    # dictionary of the form: {processed stat name (string) : [function to call to give this stat its value, additional arguments to give to that function]}
+    # if the arguments to give to the function are strings that match an existing stat name, the value associated with that stat is put in its place.
+    special_processed_stats = {}
+
+    # THIRD STAGE STATS (writing second and/or first stage stats to a file)
+
+    # dictionary of the form: {stat name string that gets written into the file : first or second stage stat to use}
+    write_stats = {}
+
+    # FOURTH AND FINAL STAGE STATS (averaging across rounds)
+
+    # values to average across rounds
+    cross_round_averaged_stats = []
+
+    # internal var used for linking to previous stages in instance declarations
+    _prev_stage_indices = [0, 0, 0, 0]
+
+    def __init__(self, 
+                name = "", 
+                cumulative_raw_stats = [], 
+                special_raw_stats = {}, 
+                averaged_stats = [], 
+                special_processed_stats = {}, 
+                write_stats = {}, 
+                cross_round_averaged_stats = []):
+
+        self.name = name
+        self.cumulative_raw_stats = cumulative_raw_stats
+        self.special_raw_stats = special_raw_stats
+
+        for key in averaged_stats:
+            for i in range(0, len(averaged_stats[key]) - 1):
+                argument = averaged_stats[key][i]
+                if argument == StatToken.SELF: 
+                    averaged_stats[key][i] = key
+
+        self.averaged_stats = averaged_stats
+        self.special_processed_stats = special_processed_stats
+
+        for key in write_stats:
+            if write_stats[key] == StatToken.SELF:
+                write_stats[key] = key
+                
+        self.write_stats = write_stats
+        self.cross_round_averaged_stats = cross_round_averaged_stats
+
+sendmaps_total = TrackedStat(
+    name="sendmaps_total",
+    cumulative_raw_stats=["sendmaps_total_cost", "sendmaps_total_calls"],
+    averaged_stats={"sendmaps_cost_per_tick": ["sendmaps_total_cost", "sendmaps_total_calls"]},
+    write_stats={"sendmaps_cost_per_tick" : StatToken.SELF}, #associating it with Self makes __init__() associate the value with the key
+    cross_round_averaged_stats=["sendmaps_cost_per_tick"])
 
 # first pass of data parsing: populate the data dictionary with info
 # for all round ids we've not ingested before
@@ -247,45 +370,65 @@ def add_new_value(list, new_value, value_creator):
     player_total = 0
     td_total = 0
 
-    sendmaps_total_cost = 0 #all of these only use the last rows data which is the real total for that round
-    sendmaps_total_calls = 0
+    stats = {}
+
+    cumulative_raw_stats = []
+    special_raw_stats = {}
+
+    first_stage_stats = {}
+
+    # all of these only use the last rows data which is the real total for that round
+    stats["sendmaps_total_cost"] = 0
+    stats["sendmaps_total_calls"] = 0
 
-    sendmaps_client_cost = 0
-    sendmaps_client_calls = 0
+    stats["sendmaps_client_cost"] = 0
+    stats["sendmaps_client_calls"] = 0
 
-    movable_changes_cost = 0
-    movable_changes_calls = 0
+    stats["movable_changes_cost"] = 0
+    stats["movable_changes_calls"] = 0
 
-    check_turf_vis_contents_cost = 0
-    check_turf_vis_contents_calls = 0
+    stats["check_turf_vis_contents_cost"] = 0
+    stats["check_turf_vis_contents_calls"] = 0
 
-    check_hud_image_vis_contents_cost = 0
-    check_hud_image_vis_contents_calls = 0
+    stats["check_hud_image_vis_contents_cost"] = 0
+    stats["check_hud_image_vis_contents_calls"] = 0
 
-    loop_turfs_in_range_cost = 0
-    loop_turfs_in_range_calls = 0
+    stats["loop_turfs_in_range_cost"] = 0
+    stats["loop_turfs_in_range_calls"] = 0
 
-    obj_changes_cost = 0
-    obj_changes_calls = 0
+    stats["obj_changes_cost"] = 0
+    stats["obj_changes_calls"] = 0
 
-    mob_changes_cost = 0
-    mob_changes_calls = 0
+    stats["mob_changes_cost"] = 0
+    stats["mob_changes_calls"] = 0
 
-    movables_examined = 0
+    stats["movables_examined"] = 0
 
     has_sendmaps_profiler_logs = False
 
     csvfile = open(f_name, newline='')
     reader = csv.DictReader(csvfile)
-    #read all the data 
+
+    get_row = lambda row, row_stat, null_val=0: float(row.get(row_stat) or null_val)
+
+    # read all the data
     for row in reader:
         lines_read += 1
-        maptick_total += float(row["maptick"])
+        for stat_to_add in cumulative_raw_stats:
+            first_stage_stats[stat_to_add] = get_row(row, stat_to_add)
+
+        for special_stat in special_raw_stats:
+            func = special_raw_stats[special_stat]
+            first_stage_stats[special_stat] = func(get_row(row, special_stat), first_stage_stats[special_stat])
+
+        maptick_total += get_row(row, "maptick")
         player_total += float(row["players"])
-        td_total += float(row["tidi_avg"]) 
+        td_total += float(row["tidi_avg"])
 
-        sendmaps_total_cost = float(row.get("send_maps") or 0)#the last row read is the final value for these
-        sendmaps_total_calls = float(row.get("send_maps_count") or 0)#have to use .get(index) or 0 because not all logs have these indices
+        # the last row read is the final value for these
+        sendmaps_total_cost = float(row.get("send_maps") or 0)
+        # have to use .get(index) or 0 because not all logs have these indices
+        sendmaps_total_calls = float(row.get("send_maps_count") or 0)
         if sendmaps_total_cost != 0.0:
             has_sendmaps_profiler_logs = True
 
@@ -314,33 +457,38 @@ def add_new_value(list, new_value, value_creator):
 
     csvfile.close()
 
-    #In the template perf-[roundid]-[mapname]-[servername].csv
-    file_without_ending = f_name.split(".")[0] 
-    properties = file_without_ending.split("-") #This will get messy if you have a - in the system path
+    # In the template perf-[roundid]-[mapname]-[servername].csv
+    file_without_ending = f_name.split(".")[0]
+    # This will get messy if you have a - in the system path
+    properties = file_without_ending.split("-")
     if len(properties) < 3:
         print(f"ERROR: [{f_name}] Is being improperly parsed")
-    id = properties[1] #The second item in this list should be id
-    map = properties[2] #The third item is the map name
-    server = properties[3] #Fourth term's the server this round came from, we'll need that soon
+    id = properties[1]  # The second item in this list should be id
+    map = properties[2]  # The third item is the map name
+    # Fourth term's the server this round came from, we'll need that soon
+    server = properties[3]
 
     if not id.isnumeric():
         print("Found a non numeric round id, [id], skipping")
         continue
 
-    #There was a short period where we were parsing byond's maptick values incorrectly.
-    #This lead to irrecovorably broken logs. This check exists to handle them
-    #Let's try not to add any more yeah?
+    # There was a short period where we were parsing byond's maptick values incorrectly.
+    # This lead to irrecovorably broken logs. This check exists to handle them
+    # Let's try not to add any more yeah?
     intid = int(id)
     if intid >= 164722 and intid <= 164824:
-        continue 
-    
+        continue
+
     maptick_by_players = 0
     td_by_players = 0
     avg_maptick = 0
     avg_players = 0
     avg_td = 0
 
-    sendmaps_cost_per_tick = 0 #absolute cost values: either milliseconds, microseconds, or total movables examined
+    averages = {}
+
+    # absolute cost values: either milliseconds, microseconds, or total movables examined
+    sendmaps_cost_per_tick = 0
     sendmaps_clients = 0
     avg_cost_per_client = 0
     avg_cost_movable_changes = 0
@@ -351,13 +499,16 @@ def add_new_value(list, new_value, value_creator):
     avg_cost_mob_changes = 0
     avg_movables_examined = 0
 
+    def average_if_valid(numerator, denominator): return to_microseconds(
+        numerator / denominator) if denominator > 0 else 0
+
     if has_sendmaps_profiler_logs:
-        #the cost vars are always in seconds which makes most of them very small. converting to microseconds is much better
-        sendmaps_cost_per_tick = to_microseconds(sendmaps_total_cost / sendmaps_total_calls)
-        sendmaps_clients = sendmaps_client_calls / sendmaps_total_calls 
+        # the cost vars are always in seconds which makes most of them very small. converting to microseconds is much better
+        sendmaps_cost_per_tick = to_microseconds(
+            sendmaps_total_cost / sendmaps_total_calls)
+        sendmaps_clients = sendmaps_client_calls / sendmaps_total_calls
 
-        if sendmaps_client_calls:
-            avg_cost_per_client = to_microseconds(sendmaps_total_cost / sendmaps_client_calls)
+        avg_cost_per_client = average_if_valid(sendmaps_total_cost, sendmaps_client_calls)
         if movable_changes_calls:
             avg_cost_movable_changes = to_microseconds(movable_changes_cost / movable_changes_calls)
         if check_turf_vis_contents_calls:
@@ -369,7 +520,8 @@ def add_new_value(list, new_value, value_creator):
         if obj_changes_calls:
             avg_cost_obj_changes = to_microseconds(obj_changes_cost / obj_changes_calls)
         if mob_changes_calls:
-            avg_cost_mob_changes = to_microseconds(mob_changes_cost / mob_changes_calls)
+            avg_cost_mob_changes = to_microseconds(
+                mob_changes_cost / mob_changes_calls)
         if sendmaps_client_calls:
             avg_movables_examined = movables_examined / sendmaps_client_calls
 
@@ -381,19 +533,19 @@ def add_new_value(list, new_value, value_creator):
         avg_players = player_total / lines_read
         avg_td = td_total / lines_read
 
-    #finalize our data collection by map, server, and generic single stat files
+    # finalize our data collection by map, server, and generic single stat files
     pending = [map, server, "maptick", "highpass_maptick"]
     for index in pending:
-        if index not in data: #If one doesn't already exist, make a new list to put our map data into
+        if index not in data:  # If one doesn't already exist, make a new list to put our map data into
             data[index] = []
         if index == "highpass_maptick" and (maptick_by_players > highpass):
             continue
         to_write = {}
-        
+
         to_write["id"] = id
         to_write["maptick_to_player"] = maptick_by_players
         to_write["maptick"] = avg_maptick
-        to_write["players"] = avg_players 
+        to_write["players"] = avg_players
         to_write["td"] = avg_td
 
         if td_by_players > 1.2:
@@ -414,64 +566,70 @@ def add_new_value(list, new_value, value_creator):
 
     print(f"Read [{id}] [{map}] [{server}]")
 
-#Now that we've done a first pass, we need to go back over things again 
-#These are all the file names that need operating on
+# Now that we've done a first pass, we need to go back over things again
+# These are all the file names that need operating on
 for index in data:
     working_list = data[index]
-    #Before you open it for writing, if we're working from a starting point, write all the untouched lines into the cache
+    # Before you open it for writing, if we're working from a starting point, write all the untouched lines into the cache
     write_to_file = ""
-    
+
     write_to_file += make_list_into_string(fieldnames)
 
     key = f"last_round_fully_processed_{index}"
-    #Preps existing csv files for our new input, careful this gets messy fast
+    # Preps existing csv files for our new input, careful this gets messy fast
     if preserve_old_files and id_start_at and key in old_log:
         round_start_at = old_log[key]
-        
-        round_start_at = min(int(round_start_at), int(old_log["last_round_fully_processed"]))
+
+        round_start_at = min(int(round_start_at), int(
+            old_log["last_round_fully_processed"]))
         read_from = open(f"{output_loc}{index}.csv", 'r')
-        
+
         file_contents = read_from.read()
         read_from.close()
 
         file_contents = file_contents.strip("\n")
 
         file_contents = file_contents.split("\n")
-        file_contents = file_contents[1:]#Get rid of the first line, which should just be the headers
+        # Get rid of the first line, which should just be the headers
+        file_contents = file_contents[1:]
 
         last_sane_round = file_binary_search(file_contents, round_start_at)
         if last_sane_round > 0:
-            file_contents = file_contents[:last_sane_round + 1] #Cut out the entries we're going to touch
+            # Cut out the entries we're going to touch
+            file_contents = file_contents[:last_sane_round + 1]
             write_to_file += "\n".join(file_contents)
 
-    length_of_rows = len(working_list) - 1 # If there's one item, I want this to be 0
-    
-    #These two dicts are key -> list[interested value, [list of members]]
+    # If there's one item, I want this to be 0
+    length_of_rows = len(working_list) - 1
+
+    # These two dicts are key -> list[interested value, [list of members]]
     local_min = {}
     local_max = {}
     for key_type in keys_to_average:
         local_min[key_type] = [MAX, []]
-        local_max[key_type] = [0, []] 
+        local_max[key_type] = [0, []]
 
     for i in range(length_of_rows):
         row = working_list[i]
-            
+
         look_behind = i - movingbackward
         look_ahead = i + movingforward
         do_not_remove = False
         do_not_add = False
 
-        #Wrapping, this is why there's those flat lines at the edges of the graph
+        # Wrapping, this is why there's those flat lines at the edges of the graph
         if look_behind < 0:
-            delta_behind = abs(look_behind) #delta will be the remainder of look_ahead
+            # delta will be the remainder of look_ahead
+            delta_behind = abs(look_behind)
             look_behind = 0
-            look_ahead = min(look_ahead + delta_behind, length_of_rows)     
+            look_ahead = min(look_ahead + delta_behind, length_of_rows)
 
         if look_ahead > length_of_rows:
-            delta_ahead = look_ahead - length_of_rows #delta will be the remainder of look_behind
+            # delta will be the remainder of look_behind
+            delta_ahead = look_ahead - length_of_rows
             look_ahead = length_of_rows
-            look_behind = max(look_behind - delta_ahead, 0)     
-        
+            look_behind = max(look_behind - delta_ahead, 0)
+
         if i - boundforward < 0:
             do_not_add = True
 
@@ -479,7 +637,7 @@ def add_new_value(list, new_value, value_creator):
             do_not_remove = True
 
         totals = {}
-        
+
         for key_type in keys_to_average:
             totals[key_type] = 0
 
@@ -492,32 +650,35 @@ def add_new_value(list, new_value, value_creator):
 
             if do_not_add:
                 continue
-            
+
             newest_val = data[index][i][key_type]
             add_new_value(min_list, newest_val, min)
             add_new_value(max_list, newest_val, max)
 
-        for ii in range(look_behind, look_ahead): #Look through them all
+        for ii in range(look_behind, look_ahead):  # Look through them all
             look_at = data[index][ii]
             for key_type in keys_to_average:
                 totals[key_type] += look_at[key_type]
 
-        total_read = (look_ahead - look_behind) + 1 #Add 1 so reading one line doesn't read an average of 0
-        
+        # Add 1 so reading one line doesn't read an average of 0
+        total_read = (look_ahead - look_behind) + 1
+
         for key_type in keys_to_average:
             row[f"avg_{key_type}"] = totals[key_type] / total_read
             row[f"min_{key_type}"] = local_min[key_type][0]
-            row[f"max_{key_type}"] = local_max[key_type][0]        
+            row[f"max_{key_type}"] = local_max[key_type][0]
 
         write_to_file += turn_dict_into_comma_seperated_string(row, fieldnames)
 
         rnd_id = row["id"]
         print(f"Write [{index}] [{i}] [{rnd_id}]")
 
-    last_good_subset_round = working_list[-min(len(working_list), total_moving_space)]["id"]
+    last_good_subset_round = working_list[-min(
+        len(working_list), total_moving_space)]["id"]
     data_log[key] = last_good_subset_round
     if index in maps_we_care_about:
-        data_log["last_round_fully_processed"] = min(int(last_good_subset_round), int(data_log["last_round_fully_processed"]))
+        data_log["last_round_fully_processed"] = min(
+            int(last_good_subset_round), int(data_log["last_round_fully_processed"]))
 
     output = open(f"{output_loc}{index}.csv", 'w')
     output.write(write_to_file)
diff --git a/root/SingleRound.py b/root/SingleRound.py
index a9da736..2996c80 100644
--- a/root/SingleRound.py
+++ b/root/SingleRound.py
@@ -3,10 +3,6 @@
 import sys
 import subprocess
 import os.path
-
-#output_loc = "maptick/"
-#if not os.path.exists(output_loc):
-#    os.makedir(output_loc)
     
 output_to = "single_round/temporary"
 read_from = "output/"
diff --git a/root/maptick_plot.gnuplot b/root/maptick_plot.gnuplot
index 73ab819..0981d8f 100644
--- a/root/maptick_plot.gnuplot
+++ b/root/maptick_plot.gnuplot
@@ -33,7 +33,6 @@ filename = sprintf("%s%s", outputfolder, filename)
 outputfile13 = sprintf("%s Average%s", filename, outputformat)
 outputfile14 = sprintf("%s Average By Map%s", filename, outputformat)
 outputfile15 = sprintf("%s Average By Server%s", filename, outputformat)
-#outputfile16 = sprintf("%s Average%s", filename, outputformat)
 
 set key autotitle columnheader 
 set key noenhanced

From 79429e2a8b2fb9e2c8d8d8020b8e5aebae3fd674 Mon Sep 17 00:00:00 2001
From: KylerAce <kylerlumpkin1@gmail.com>
Date: Mon, 3 Apr 2023 00:58:50 -0700
Subject: [PATCH 4/5] is this thing on

---
 root/MaptickAverager.py | 304 ++++++++--------------------------------
 1 file changed, 62 insertions(+), 242 deletions(-)

diff --git a/root/MaptickAverager.py b/root/MaptickAverager.py
index 83f5dda..fca2d3f 100644
--- a/root/MaptickAverager.py
+++ b/root/MaptickAverager.py
@@ -90,9 +90,6 @@ def copy_dict_into_dict(copy_from, copy_into, keys_to_ignore):
             continue
         copy_into[key] = copy_from[key]
 
-# Modified binary search. check_function returns 1 if the first index is "larger" then the second, -1 if it's smaller, and 0 if they're the same
-
-
 def round_binary_search(arr, look_for):
     look_for = int(look_for)
     low = 0
@@ -264,103 +261,6 @@ def add_new_value(list, new_value, value_creator):
 # Dictionary of file names to dictionaries of data to be written later.
 data = {}
 
-# most processed stats are averages of two values, this just makes it easier to define
-
-
-def PROCESSED_STAT_AVERAGE(numerator, denominator, scaling_func): return [
-    numerator, denominator, scaling_func] if scaling_func else [numerator, denominator]
-
-# scaling_func = additional function to call on the fraction to scale it before returning
-
-
-def avg(numerator, denominator, scaling_func=to_microseconds):
-    if(denominator > 0):
-        return scaling_func(numerator / denominator)
-    else:
-        return 0
-
-class StatToken(enum.Enum):
-    USE_PREVIOUS_SIMPLE_STAGE = auto()
-    SELF = auto()
-
-# holder for data used to determine what stats to grab from the raw files and what to do with that data afterwards.
-# these dont actually do work themselves, they're just a helpful way to define a pipeline of raw data to processed statistics.
-# the actual work is done via lists / dictionaries created to hold the stats defined in instances of this class (and subtypes)
-class TrackedStat:
-    name = ""
-
-    # FIRST STAGE STATS (reading directly from rows, all defined stats at this stage go into first_stage_stats)
-
-    # the names of the stats we read from each row, each of these will be added to a cumulative value
-    # list of the form: [string exactly matching a stat grabbed from the row]
-    cumulative_raw_stats = []
-
-    # like cumulative_raw_stats, but they arent just added to with the value from each row, you can define how the stored value is changed with each read pass
-    # dictionary of the form: {string exactly matching a stat grabbed from the row : function reference to call each pass}
-    # you probably dont need this, it slows down reading
-    special_raw_stats = {}
-
-    # SECOND STAGE STATS (iterating over first stage stats, all defined stats at this stage go into second_stage_stats)
-
-    # stats that are averaged from two first stage stats
-    # dictionary of the form: {processed stat name (string) : [numerator stat read from rows, denominator stat read from rows, scaling function if not to_microseconds]}
-    # most second stage stats go in here
-    averaged_stats = {}
-
-    # like averaged_stats except you can define other functions to use
-    # dictionary of the form: {processed stat name (string) : [function to call to give this stat its value, additional arguments to give to that function]}
-    # if the arguments to give to the function are strings that match an existing stat name, the value associated with that stat is put in its place.
-    special_processed_stats = {}
-
-    # THIRD STAGE STATS (writing second and/or first stage stats to a file)
-
-    # dictionary of the form: {stat name string that gets written into the file : first or second stage stat to use}
-    write_stats = {}
-
-    # FOURTH AND FINAL STAGE STATS (averaging across rounds)
-
-    # values to average across rounds
-    cross_round_averaged_stats = []
-
-    # internal var used for linking to previous stages in instance declarations
-    _prev_stage_indices = [0, 0, 0, 0]
-
-    def __init__(self, 
-                name = "", 
-                cumulative_raw_stats = [], 
-                special_raw_stats = {}, 
-                averaged_stats = [], 
-                special_processed_stats = {}, 
-                write_stats = {}, 
-                cross_round_averaged_stats = []):
-
-        self.name = name
-        self.cumulative_raw_stats = cumulative_raw_stats
-        self.special_raw_stats = special_raw_stats
-
-        for key in averaged_stats:
-            for i in range(0, len(averaged_stats[key]) - 1):
-                argument = averaged_stats[key][i]
-                if argument == StatToken.SELF: 
-                    averaged_stats[key][i] = key
-
-        self.averaged_stats = averaged_stats
-        self.special_processed_stats = special_processed_stats
-
-        for key in write_stats:
-            if write_stats[key] == StatToken.SELF:
-                write_stats[key] = key
-                
-        self.write_stats = write_stats
-        self.cross_round_averaged_stats = cross_round_averaged_stats
-
-sendmaps_total = TrackedStat(
-    name="sendmaps_total",
-    cumulative_raw_stats=["sendmaps_total_cost", "sendmaps_total_calls"],
-    averaged_stats={"sendmaps_cost_per_tick": ["sendmaps_total_cost", "sendmaps_total_calls"]},
-    write_stats={"sendmaps_cost_per_tick" : StatToken.SELF}, #associating it with Self makes __init__() associate the value with the key
-    cross_round_averaged_stats=["sendmaps_cost_per_tick"])
-
 # first pass of data parsing: populate the data dictionary with info
 # for all round ids we've not ingested before
 for index in range(id_start_at, len(input)):
@@ -370,90 +270,57 @@ def __init__(self,
     player_total = 0
     td_total = 0
 
-    stats = {}
-
-    cumulative_raw_stats = []
-    special_raw_stats = {}
-
-    first_stage_stats = {}
-
-    # all of these only use the last rows data which is the real total for that round
-    stats["sendmaps_total_cost"] = 0
-    stats["sendmaps_total_calls"] = 0
-
-    stats["sendmaps_client_cost"] = 0
-    stats["sendmaps_client_calls"] = 0
-
-    stats["movable_changes_cost"] = 0
-    stats["movable_changes_calls"] = 0
-
-    stats["check_turf_vis_contents_cost"] = 0
-    stats["check_turf_vis_contents_calls"] = 0
-
-    stats["check_hud_image_vis_contents_cost"] = 0
-    stats["check_hud_image_vis_contents_calls"] = 0
-
-    stats["loop_turfs_in_range_cost"] = 0
-    stats["loop_turfs_in_range_calls"] = 0
-
-    stats["obj_changes_cost"] = 0
-    stats["obj_changes_calls"] = 0
-
-    stats["mob_changes_cost"] = 0
-    stats["mob_changes_calls"] = 0
-
-    stats["movables_examined"] = 0
-
     has_sendmaps_profiler_logs = False
 
     csvfile = open(f_name, newline='')
     reader = csv.DictReader(csvfile)
 
-    get_row = lambda row, row_stat, null_val=0: float(row.get(row_stat) or null_val)
+    #raw_rows = csvfile.readlines()
+    #rows_with_fields = dict(zip(reader.fieldnames, raw_rows))
+
+    get_value = lambda row, row_stat, null_val=0: float(row.get(row_stat) or null_val) if row != None else null_val
+
+    last_row = None
 
     # read all the data
     for row in reader:
         lines_read += 1
-        for stat_to_add in cumulative_raw_stats:
-            first_stage_stats[stat_to_add] = get_row(row, stat_to_add)
-
-        for special_stat in special_raw_stats:
-            func = special_raw_stats[special_stat]
-            first_stage_stats[special_stat] = func(get_row(row, special_stat), first_stage_stats[special_stat])
+        last_row = row.copy()
 
-        maptick_total += get_row(row, "maptick")
-        player_total += float(row["players"])
-        td_total += float(row["tidi_avg"])
+        maptick_total += get_value(row, "maptick")
+        player_total += get_value(row, "players")
+        td_total += get_value(row, "tidi_avg")
 
-        # the last row read is the final value for these
-        sendmaps_total_cost = float(row.get("send_maps") or 0)
-        # have to use .get(index) or 0 because not all logs have these indices
-        sendmaps_total_calls = float(row.get("send_maps_count") or 0)
-        if sendmaps_total_cost != 0.0:
-            has_sendmaps_profiler_logs = True
+    # the last row read is the final value for these
+    sendmaps_total_cost = get_value(last_row, "send_maps")
+    # have to use .get(index) or 0 because not all logs have these indices
+    sendmaps_total_calls = get_value(last_row, "send_maps_count")
+    if sendmaps_total_cost != 0.0:
+        has_sendmaps_profiler_logs = True
+        print("has_sendmaps_profiler_logs = True")
 
-        sendmaps_client_cost = float(row.get("per_client") or 0)
-        sendmaps_client_calls = float(row.get("per_client_count") or 0)
+    sendmaps_client_cost = get_value(last_row, "per_client")
+    sendmaps_client_calls = get_value(last_row, "per_client_count")
 
-        movable_changes_cost = float(row.get("look_for_movable_changes") or 0)
-        movable_changes_calls = float(row.get("look_for_movable_changes_count") or 0)
+    movable_changes_cost = get_value(last_row, "look_for_movable_changes")
+    movable_changes_calls = get_value(last_row, "look_for_movable_changes_count")
 
-        check_turf_vis_contents_cost = float(row.get("check_turf_vis_conts") or 0)
-        check_turf_vis_contents_calls = float(row.get("check_turf_vis_conts_count") or 0)
+    check_turf_vis_contents_cost = get_value(last_row, "check_turf_vis_conts")
+    check_turf_vis_contents_calls = get_value(last_row, "check_turf_vis_conts_count")
 
-        check_hud_image_vis_contents_cost = float(row.get("check_hud/image_vis_contents") or 0)
-        check_hud_image_vis_contents_calls = float(row.get("check_hud/image_vis_contents_count") or 0)
+    check_hud_image_vis_contents_cost = get_value(last_row, "check_hud/image_vis_contents")
+    check_hud_image_vis_contents_calls = get_value(last_row, "check_hud/image_vis_contents_count")
 
-        loop_turfs_in_range_cost = float(row.get("turfs_in_range") or 0)
-        loop_turfs_in_range_calls = float(row.get("turfs_in_range_count") or 0)
+    loop_turfs_in_range_cost = get_value(last_row, "turfs_in_range")
+    loop_turfs_in_range_calls = get_value(last_row, "turfs_in_range_count")
 
-        obj_changes_cost = float(row.get("obj_changes") or 0)
-        obj_changes_calls = float(row.get("obj_changes_count") or 0)
+    obj_changes_cost = get_value(last_row, "obj_changes")
+    obj_changes_calls = get_value(last_row, "obj_changes_count")
 
-        mob_changes_cost = float(row.get("mob_changes") or 0)
-        mob_changes_calls = float(row.get("mob_changes_count") or 0)
+    mob_changes_cost = get_value(last_row, "mob_changes")
+    mob_changes_calls = get_value(last_row, "mob_changes_count")
 
-        movables_examined = float(row.get("movables_examined") or 0)
+    movables_examined = get_value(last_row, "movables_examined")
 
     csvfile.close()
 
@@ -479,90 +346,43 @@ def __init__(self,
     if intid >= 164722 and intid <= 164824:
         continue
 
-    maptick_by_players = 0
-    td_by_players = 0
-    avg_maptick = 0
-    avg_players = 0
-    avg_td = 0
-
-    averages = {}
-
-    # absolute cost values: either milliseconds, microseconds, or total movables examined
-    sendmaps_cost_per_tick = 0
-    sendmaps_clients = 0
-    avg_cost_per_client = 0
-    avg_cost_movable_changes = 0
-    avg_cost_turf_vis_contents = 0
-    avg_cost_hud_image_vis_contents = 0
-    avg_cost_turfs_in_range = 0
-    avg_cost_obj_changes = 0
-    avg_cost_mob_changes = 0
-    avg_movables_examined = 0
-
-    def average_if_valid(numerator, denominator): return to_microseconds(
-        numerator / denominator) if denominator > 0 else 0
-
-    if has_sendmaps_profiler_logs:
-        # the cost vars are always in seconds which makes most of them very small. converting to microseconds is much better
-        sendmaps_cost_per_tick = to_microseconds(
-            sendmaps_total_cost / sendmaps_total_calls)
-        sendmaps_clients = sendmaps_client_calls / sendmaps_total_calls
-
-        avg_cost_per_client = average_if_valid(sendmaps_total_cost, sendmaps_client_calls)
-        if movable_changes_calls:
-            avg_cost_movable_changes = to_microseconds(movable_changes_cost / movable_changes_calls)
-        if check_turf_vis_contents_calls:
-            avg_cost_turf_vis_contents = to_microseconds(check_turf_vis_contents_cost / check_turf_vis_contents_calls)
-        if check_hud_image_vis_contents_calls:
-            avg_cost_hud_image_vis_contents = to_microseconds(check_hud_image_vis_contents_cost / check_hud_image_vis_contents_calls)
-        if loop_turfs_in_range_calls:
-            avg_cost_turfs_in_range = to_microseconds(loop_turfs_in_range_cost / loop_turfs_in_range_calls)
-        if obj_changes_calls:
-            avg_cost_obj_changes = to_microseconds(obj_changes_cost / obj_changes_calls)
-        if mob_changes_calls:
-            avg_cost_mob_changes = to_microseconds(
-                mob_changes_cost / mob_changes_calls)
-        if sendmaps_client_calls:
-            avg_movables_examined = movables_examined / sendmaps_client_calls
-
-    if player_total:
-        maptick_by_players = maptick_total / player_total
-        td_by_players = td_total / player_total
-    if lines_read:
-        avg_maptick = maptick_total / lines_read
-        avg_players = player_total / lines_read
-        avg_td = td_total / lines_read
+    def average_if_valid(numerator, denominator): return numerator / denominator if denominator > 0 else 0
+    def average_if_exists(numerator, denominator): return average_if_valid(numerator, denominator) if has_sendmaps_profiler_logs == True else 0
+
+    td_per_player = average_if_exists(td_total, player_total)
+    if td_per_player > 1.2:
+        td_per_player = 0.6
+
+    to_write = {}
+
+    to_write["id"] = id
+    to_write["maptick_to_player"] = average_if_valid(maptick_total, player_total)
+    to_write["maptick"] = average_if_valid(maptick_total, lines_read)
+    to_write["players"] = average_if_valid(player_total, lines_read)
+    to_write["td"] = average_if_exists(td_total, lines_read)
+    
+    to_write["td_to_player"] = td_per_player
+
+    to_write["sendmaps_cost_per_tick"] = to_microseconds(average_if_exists(sendmaps_total_cost, sendmaps_total_calls))
+    to_write["per_client"] = to_microseconds(average_if_exists(sendmaps_client_cost, sendmaps_client_calls))
+    to_write["look_for_movable_changes"] = to_microseconds(average_if_exists(movable_changes_cost, movable_changes_calls))
+    to_write["check_turf_vis_conts"] = to_microseconds(average_if_exists(check_turf_vis_contents_cost, check_turf_vis_contents_calls))
+    to_write["check_hud/image_vis_contents"] = to_microseconds(average_if_exists(check_hud_image_vis_contents_cost, check_hud_image_vis_contents_calls))
+    to_write["turfs_in_range"] = to_microseconds(average_if_exists(loop_turfs_in_range_cost, loop_turfs_in_range_calls))
+    to_write["obj_changes"] = to_microseconds(average_if_exists(obj_changes_cost, obj_changes_calls))
+    to_write["mob_changes"] = to_microseconds(average_if_exists(mob_changes_cost, mob_changes_calls))
+    to_write["movables_examined"] = average_if_exists(movables_examined, sendmaps_client_calls)
 
     # finalize our data collection by map, server, and generic single stat files
     pending = [map, server, "maptick", "highpass_maptick"]
     for index in pending:
         if index not in data:  # If one doesn't already exist, make a new list to put our map data into
             data[index] = []
-        if index == "highpass_maptick" and (maptick_by_players > highpass):
+        if index == "highpass_maptick" and (to_write["maptick_to_player"] > highpass):
             continue
-        to_write = {}
-
-        to_write["id"] = id
-        to_write["maptick_to_player"] = maptick_by_players
-        to_write["maptick"] = avg_maptick
-        to_write["players"] = avg_players
-        to_write["td"] = avg_td
-
-        if td_by_players > 1.2:
-            td_by_players = 0.6
-        to_write["td_to_player"] = td_by_players
-
-        to_write["sendmaps_cost_per_tick"] = sendmaps_cost_per_tick
-        to_write["per_client"] = avg_cost_per_client
-        to_write["look_for_movable_changes"] = avg_cost_movable_changes
-        to_write["check_turf_vis_conts"] = avg_cost_turf_vis_contents
-        to_write["check_hud/image_vis_contents"] = avg_cost_hud_image_vis_contents
-        to_write["turfs_in_range"] = avg_cost_turfs_in_range
-        to_write["obj_changes"] = avg_cost_obj_changes
-        to_write["mob_changes"] = avg_cost_mob_changes
-        to_write["movables_examined"] = avg_movables_examined
-
-        data[index].append(to_write)
+        
+        #print(to_write.copy())
+        data[index].append(to_write.copy())
 
     print(f"Read [{id}] [{map}] [{server}]")
 

From 2d483c445825c6d96b71d4c4778ea0a02732fc54 Mon Sep 17 00:00:00 2001
From: KylerAce <kylerlumpkin1@gmail.com>
Date: Mon, 3 Apr 2023 02:16:42 -0700
Subject: [PATCH 5/5] diff fixes

---
 root/MaptickAverager.py | 3 ---
 1 file changed, 3 deletions(-)

diff --git a/root/MaptickAverager.py b/root/MaptickAverager.py
index fca2d3f..da81d9d 100644
--- a/root/MaptickAverager.py
+++ b/root/MaptickAverager.py
@@ -3,8 +3,6 @@
 import os
 import os.path
 import sys
-import enum
-from enum import auto
 
 MAX = sys.float_info.max
 
@@ -297,7 +295,6 @@ def add_new_value(list, new_value, value_creator):
     sendmaps_total_calls = get_value(last_row, "send_maps_count")
     if sendmaps_total_cost != 0.0:
         has_sendmaps_profiler_logs = True
-        print("has_sendmaps_profiler_logs = True")
 
     sendmaps_client_cost = get_value(last_row, "per_client")
     sendmaps_client_calls = get_value(last_row, "per_client_count")