From da4c2d7cec65313f5617b08ce68ace63bd74c1aa Mon Sep 17 00:00:00 2001
From: Frank Sabates <73601477+FrankS-2024@users.noreply.github.com>
Date: Sat, 24 Jan 2026 18:00:28 -0800
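Subject: [PATCH] Use symmetric sine axis labels

Sine plots now scale the treatment (up) and control (down) tracks with
one shared maximum, and draw_sine_axis_for_group labels both ends of the
axis with that same value (+/-) instead of two independent maxima.

Also apply "--point_stat max" per bin while downsampling in
make_raw_data_filled rather than in draw_standard_spark (which now
always averages), and add example SVG outputs under Images/.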
---
 Images/spark_demo_output.svg   |  11 ++++
 Images/spark_pointstat_avg.svg |   9 +++
 Images/spark_pointstat_max.svg |   9 +++
 SparK.py                       | 113 +++++++++++++++++----------------
 4 files changed, 89 insertions(+), 53 deletions(-)
 create mode 100644 Images/spark_demo_output.svg
 create mode 100644 Images/spark_pointstat_avg.svg
 create mode 100644 Images/spark_pointstat_max.svg
diff --git a/Images/spark_demo_output.svg b/Images/spark_demo_output.svg
new file mode 100644
index 0000000..1023cb6
--- /dev/null
+++ b/Images/spark_demo_output.svg
@@ -0,0 +1,11 @@
+<svg style="background:#ffffff" viewBox="0 0 320 210.0" xmlns="http://www.w3.org/2000/svg">
+<polygon points="50.0,100.0 53.0,106.75 56.0,108.496 59.0,108.496 62.0,110.125 65.0,110.125 68.0,111.52 71.0,111.52 74.0,112.6 77.0,112.6 80.0,113.266 83.0,113.266 86.0,113.5 89.0,113.5 92.0,113.266 95.0,113.266 98.0,112.6 101.0,112.6 104.0,111.52 107.0,111.52 110.0,110.125 113.0,110.125 116.0,108.496 119.0,108.496 122.0,106.75 125.0,106.75 128.0,105.004 131.0,105.004 134.0,103.375 137.0,103.375 140.0,101.98 143.0,101.98 146.0,100.9 149.0,100.9 152.0,100.234 155.0,100.234 158.0,100.0 161.0,100.0 164.0,100.234 167.0,100.234 170.0,100.9 173.0,100.9 176.0,101.98 179.0,101.98 182.0,103.375 185.0,103.375 188.0,105.004 191.0,105.004 194.0,106.75 197.0,100.0" opacity="0.6" fill="#FF1800" stroke="black" stroke-width="0"/>
+<polygon points="50.0,100.0 53.0,86.5 56.0,83.008 59.0,83.008 62.0,79.75 65.0,79.75 68.0,76.951 71.0,76.951 74.0,74.809 77.0,74.809 80.0,73.459 83.0,73.459 86.0,73.0 89.0,73.0 92.0,73.459 95.0,73.459 98.0,74.809 101.0,74.809 104.0,76.951 107.0,76.951 110.0,79.75 113.0,79.75 116.0,83.008 119.0,83.008 122.0,86.5 125.0,86.5 128.0,89.992 131.0,89.992 134.0,93.25 137.0,93.25 140.0,96.049 143.0,96.049 146.0,98.191 149.0,98.191 152.0,99.541 155.0,99.541 158.0,100.0 161.0,100.0 164.0,99.541 167.0,99.541 170.0,98.191 173.0,98.191 176.0,96.049 179.0,96.049 182.0,93.25 185.0,93.25 188.0,89.992 191.0,89.992 194.0,86.5 197.0,100.0" opacity="0.6" fill="#005CFF" stroke="black" stroke-width="0"/>
+<line x1="40" y1="127.0" x2="40" y2="73.0" stroke="black" stroke-width="1" />
+<line x1="39.5" y1="100.0" x2="43.5" y2="100.0" stroke="black" stroke-width="1" />
+<line x1="39.5" y1="73.0" x2="43.5" y2="73.0" stroke="black" stroke-width="1" />
+<text text-anchor="end" font-family="Arial" x="36" y="77.0" font-size="8" >30.0</text>
+<line x1="39.5" y1="127.0" x2="43.5" y2="127.0" stroke="black" stroke-width="1" />
+<text text-anchor="end" font-family="Arial" x="36" y="131.0" font-size="8" >-30.0</text>
+<text text-anchor="start" font-family="Arial" x="39.5" y="66.0" font-size="7" >Chr1: 0-250</text>
+</svg>
diff --git a/Images/spark_pointstat_avg.svg b/Images/spark_pointstat_avg.svg
new file mode 100644
index 0000000..9493571
--- /dev/null
+++ b/Images/spark_pointstat_avg.svg
@@ -0,0 +1,9 @@
+<svg style="background:#ffffff" viewBox="0 0 320 210.0" xmlns="http://www.w3.org/2000/svg">
+<polygon points="50.0,100.0 57.5,83.17174515235457 65.0,77.86149584487535 72.5,83.17174515235457 80.0,88.78116343490305 87.5,83.17174515235457 95.0,88.78116343490305 102.5,73.37396121883657 110.0,88.78116343490305 117.5,83.17174515235457 125.0,88.78116343490305 132.5,73.74792243767313 140.0,88.78116343490305 147.5,83.17174515235457 155.0,88.78116343490305 162.5,73.0 170.0,88.78116343490305 177.5,74.1218836565097 185.0,88.78116343490305 192.5,100.0" opacity="1" fill="#0000C1" stroke="black" stroke-width="0"/>
+<line x1="40" y1="100.0" x2="40" y2="70.0" stroke="black" stroke-width="1" />
+<line x1="39.5" y1="100.0" x2="43.5" y2="100.0" stroke="black" stroke-width="1" />
+<line x1="39.5" y1="70.0" x2="43.5" y2="70.0" stroke="black" stroke-width="1" />
+<text text-anchor="end" font-family="Arial" x="36" y="104.0" font-size="8" >0</text>
+<text text-anchor="end" font-family="Arial" x="36" y="74.0" font-size="8" >39.7</text>
+<text text-anchor="start" font-family="Arial" x="39.5" y="66.0" font-size="7" >Chr1: 0-1,000</text>
+</svg>
diff --git a/Images/spark_pointstat_max.svg b/Images/spark_pointstat_max.svg
new file mode 100644
index 0000000..cccb610
--- /dev/null
+++ b/Images/spark_pointstat_max.svg
@@ -0,0 +1,9 @@
+<svg style="background:#ffffff" viewBox="0 0 320 210.0" xmlns="http://www.w3.org/2000/svg">
+<polygon points="50.0,100.0 57.5,91.5625 65.0,73.0 72.5,91.5625 80.0,93.86363636363636 87.5,91.5625 95.0,93.86363636363636 102.5,73.0 110.0,93.86363636363636 117.5,91.5625 125.0,93.86363636363636 132.5,73.0 140.0,93.86363636363636 147.5,91.5625 155.0,93.86363636363636 162.5,73.0 170.0,93.86363636363636 177.5,73.0 185.0,93.86363636363636 192.5,100.0" opacity="1" fill="#0000C1" stroke="black" stroke-width="0"/>
+<line x1="40" y1="100.0" x2="40" y2="70.0" stroke="black" stroke-width="1" />
+<line x1="39.5" y1="100.0" x2="43.5" y2="100.0" stroke="black" stroke-width="1" />
+<line x1="39.5" y1="70.0" x2="43.5" y2="70.0" stroke="black" stroke-width="1" />
+<text text-anchor="end" font-family="Arial" x="36" y="104.0" font-size="8" >0</text>
+<text text-anchor="end" font-family="Arial" x="36" y="74.0" font-size="8" >96.8</text>
+<text text-anchor="start" font-family="Arial" x="39.5" y="66.0" font-size="7" >Chr1: 0-1,000</text>
+</svg>
diff --git a/SparK.py b/SparK.py
index 1c2b518..6155b87 100644
--- a/SparK.py
+++ b/SparK.py
@@ -134,33 +134,39 @@ def make_raw_data_filled(stretch, files, offset):  # files[ctrl,treat]
                             except:
                                 pass
 
-    # shrink to max_datapoints if bigger
-    max_datapoints = max_points
-    if stretch[2] - stretch[1] > max_datapoints:
-        binfactor_split = math.modf(float((float(stretch[2] - stretch[1]))/max_datapoints))  # get values after and before period
-        binfactor = sum(binfactor_split)
-        temp_data = [[] for u in range(len(files))]  # new data list
-        for workingfilenr in range(len(files)):
-            for position in range(max_datapoints):
-                start_postition_split = math.modf(position * binfactor)  # after and before period
-
-                # first add fraction of start position or entire value if no fraction
-                temp_value = float(raw_data_filled[workingfilenr][(int(start_postition_split[1]))] * (1 - start_postition_split[0]))
-                binfactor_left = binfactor - (1 - start_postition_split[0])
-
-                # add all values with no fractions
-                iteration = 0
-                while binfactor_left > 1:
-                    temp_value += raw_data_filled[workingfilenr][int(start_postition_split[1]) + 1 + iteration]
-                    iteration += 1
-                    binfactor_left -= 1
-
-                # add last fraction or value if no fraction
-                if binfactor_left > 0:
-                    if float((start_postition_split[1]) + 1 + iteration) < len(raw_data_filled[0]):
-                        temp_value += raw_data_filled[workingfilenr][int(start_postition_split[1]) + 1 + iteration] * binfactor_left
-                        temp_data[workingfilenr].append(temp_value/sum(binfactor_split))
-        raw_data_filled = copy.deepcopy(temp_data)
+    # shrink to max_datapoints if bigger
+    max_datapoints = max_points
+    if stretch[2] - stretch[1] > max_datapoints:
+        binfactor_split = math.modf(float((float(stretch[2] - stretch[1])) / max_datapoints))  # get values after and before period
+        binfactor = sum(binfactor_split)
+        temp_data = [[] for u in range(len(files))]  # new data list
+        for workingfilenr in range(len(files)):
+            for position in range(max_datapoints):
+                start_postition_split = math.modf(position * binfactor)  # after and before period
+                start_idx = int(start_postition_split[1])
+                if point_stat == "max":
+                    end_pos = (position + 1) * binfactor
+                    end_idx = min(len(raw_data_filled[workingfilenr]) - 1, int(math.ceil(end_pos)) - 1)
+                    temp_data[workingfilenr].append(max(raw_data_filled[workingfilenr][start_idx:end_idx + 1]))
+                    continue
+
+                # first add fraction of start position or entire value if no fraction
+                temp_value = float(raw_data_filled[workingfilenr][start_idx] * (1 - start_postition_split[0]))
+                binfactor_left = binfactor - (1 - start_postition_split[0])
+
+                # add all values with no fractions
+                iteration = 0
+                while binfactor_left > 1:
+                    temp_value += raw_data_filled[workingfilenr][start_idx + 1 + iteration]
+                    iteration += 1
+                    binfactor_left -= 1
+
+                # add last fraction or value if no fraction
+                if binfactor_left > 0:
+                    if float(start_idx + 1 + iteration) < len(raw_data_filled[0]):
+                        temp_value += raw_data_filled[workingfilenr][start_idx + 1 + iteration] * binfactor_left
+                        temp_data[workingfilenr].append(temp_value / sum(binfactor_split))
+        raw_data_filled = copy.deepcopy(temp_data)
 
     if smoothen_tracks is not None:
         raw_data_filled_smooth = [[0] * max_datapoints for r in range(len(files))]
@@ -236,22 +242,24 @@ def draw_axis_for_group(y_start_val, max_value_val, has_negative_axis):
 
         write_to_file('''<text text-anchor="end" font-family="Arial" x="''' + str(x_start - 14) + '''" y="''' + str(y_start_val + 4) + '''" font-size="''' + str(font_size_axis_y) + '''" >0</text>''')
         write_to_file('''<text text-anchor="end" font-family="Arial" x="''' + str(x_start - 14) + '''" y="''' + str(y_start_val - hight + 4) + '''" font-size="''' + str(font_size_axis_y) + '''" >''' + str(axis_label) + '''</text>''')
-def draw_sine_axis_for_group(y_start_val, pos_max_value_val, neg_max_value_val):
-    # Separate top/bottom labels derived from positive and negative datasets
-    axis_label_top = round(pos_max_value_val * (1 + (1 - relative_track_hight_percentage)), 1)
-    axis_label_bottom = round(neg_max_value_val * (1 + (1 - relative_track_hight_percentage)), 1)
-    # Draw vertical axis
-    write_to_file('''<line x1="''' + str(x_start - 10) + '''" y1="''' + str(y_start_val + hight) + '''" x2="''' + str(x_start - 10) + '''" y2="''' + str(y_start_val - hight) + '''" stroke="black" stroke-width="1" />''')
-    # 0 tick
-    write_to_file('''<line x1="''' + str(x_start - 10.5) + '''" y1="''' + str(y_start_val) + '''" x2="''' + str(x_start - 6.5) + '''" y2="''' + str(y_start_val) + '''" stroke="black" stroke-width="1" />''')
-    # Top tick and label
-    write_to_file('''<line x1="''' + str(x_start - 10.5) + '''" y1="''' + str(y_start_val - hight) + '''" x2="''' + str(x_start - 6.5) + '''" y2="''' + str(y_start_val - hight) + '''" stroke="black" stroke-width="1" />''')
-    write_to_file('''<text text-anchor="end" font-family="Arial" x="''' + str(x_start - 14) + '''" y="''' + str(y_start_val - hight + 4) + '''" font-size="''' + str(font_size_axis_y) + '''" >''' + str(axis_label_top) + '''</text>''')
-    # Bottom tick and label
-    write_to_file('''<line x1="''' + str(x_start - 10.5) + '''" y1="''' + str(y_start_val + hight) + '''" x2="''' + str(x_start - 6.5) + '''" y2="''' + str(y_start_val + hight) + '''" stroke="black" stroke-width="1" />''')
-    write_to_file('''<text text-anchor="end" font-family="Arial" x="''' + str(x_start - 14) + '''" y="''' + str(y_start_val + hight + 4) + '''" font-size="''' + str(font_size_axis_y) + '''" >-''' + str(axis_label_bottom) + '''</text>''')
-def draw_standard_spark():
-    summary_func = np.max if point_stat == "max" else np.average
+def draw_sine_axis_for_group(y_start_val, shared_max_val):
+    # Write the y-axis of a sine group: ticks sit hight * relative_track_hight_percentage above and below y_start_val and are labelled +/- round(shared_max_val, 1); nothing is written when shared_max_val <= 0
+    if shared_max_val > 0:
+        axis_height = hight * relative_track_hight_percentage
+        pos_tick_y = y_start_val - axis_height
+        neg_tick_y = y_start_val + axis_height
+        # Vertical axis line at x_start - 10, running from the negative tick to the positive tick
+        write_to_file('''<line x1="''' + str(x_start - 10) + '''" y1="''' + str(neg_tick_y) + '''" x2="''' + str(x_start - 10) + '''" y2="''' + str(pos_tick_y) + '''" stroke="black" stroke-width="1" />''')
+        # Baseline tick at y_start_val; no text label is written for zero
+        write_to_file('''<line x1="''' + str(x_start - 10.5) + '''" y1="''' + str(y_start_val) + '''" x2="''' + str(x_start - 6.5) + '''" y2="''' + str(y_start_val) + '''" stroke="black" stroke-width="1" />''')
+        # Positive tick, labelled with the shared maximum rounded to one decimal
+        write_to_file('''<line x1="''' + str(x_start - 10.5) + '''" y1="''' + str(pos_tick_y) + '''" x2="''' + str(x_start - 6.5) + '''" y2="''' + str(pos_tick_y) + '''" stroke="black" stroke-width="1" />''')
+        write_to_file('''<text text-anchor="end" font-family="Arial" x="''' + str(x_start - 14) + '''" y="''' + str(pos_tick_y + 4) + '''" font-size="''' + str(font_size_axis_y) + '''" >''' + str(round(shared_max_val, 1)) + '''</text>''')
+        # Negative tick, labelled with the same rounded value behind a literal "-"
+        write_to_file('''<line x1="''' + str(x_start - 10.5) + '''" y1="''' + str(neg_tick_y) + '''" x2="''' + str(x_start - 6.5) + '''" y2="''' + str(neg_tick_y) + '''" stroke="black" stroke-width="1" />''')
+        write_to_file('''<text text-anchor="end" font-family="Arial" x="''' + str(x_start - 14) + '''" y="''' + str(neg_tick_y + 4) + '''" font-size="''' + str(font_size_axis_y) + '''" >-''' + str(round(shared_max_val, 1)) + '''</text>''')
+def draw_standard_spark():
+    summary_func = np.average
     if len(control_data) > 1 and len(treat_data) > 1:
         last_xpos = -1
         coords = []  # y/x, spark color
@@ -356,7 +364,7 @@ def get_region_to_draw():
 parser.add_argument('-w','--track_width', help='width of the track, default = 150, int', required=False, type=int, default=150)
 parser.add_argument('-dg','--display_genes', help='genes to display from the gtf file', nargs='+', required=False, type=str)
 parser.add_argument('--max_points', help='maximum datapoints per plot', required=False, type=int, default=2000)
-parser.add_argument('--point_stat', help='per-point statistic: average or max', required=False, type=str, default='average')
+parser.add_argument('--point_stat', help='per-bin statistic for downsampling: average or max', required=False, type=str, default='average')
 parser.add_argument('--y_scale', help='scale factor for y-axis', required=False, type=float, default=1.0)
 parser.add_argument('--x_scale', help='scale factor for x-axis', required=False, type=float, default=1.0)
 parser.add_argument('-dt','--display_transcripts', help='display custom transcripts. By default, all transcripts annotated in the gtf file will be merged and displayed as one gene. Alternatively all can be plotted seperatelly by setting this to "all". Further, Transcript IDs can be listed to plot only certain transcripts', nargs='+', required=False, type=str, default=["mergeall"])
@@ -750,27 +758,26 @@ def get_region_to_draw():
             print("Error: STD plots require at least 2 control and treatment files per plot")
 
     elif plot_type == "sine": # treat points up, control points down #FIX combined with averages does not work
-        # Compute separate positive/negative maxima for independent axis labels and scaling
+        # Compute shared max so positive/negative sides use the same y-scale
         pos_max_value = 0
         neg_max_value = 0
         if treat_data:
             pos_max_value = max(max(abs(v) for v in data) for data in treat_data)
         if control_data:
             neg_max_value = max(max(abs(v) for v in data) for data in control_data)
+        shared_max_value = max(pos_max_value, neg_max_value)
         # Respect custom scales or group autoscale by overriding both sides equally
         if custom_scales is not None and custom_scales[group] != "D":
-            pos_max_value = float(custom_scales[group])
-            neg_max_value = float(custom_scales[group])
+            shared_max_value = float(custom_scales[group])
         elif group_autoscale == "yes" and ((group + 1) not in group_autoscale_excluded):
-            pos_max_value = max_value
-            neg_max_value = max_value
+            shared_max_value = max_value
 
         if len(control_data) >= 1 and len(treat_data) >= 1:
             for datafile in control_data:
                 coords = []  # y, x
                 for x, value in enumerate(datafile):
                     x_pos = x_start + (x * quantile)
-                    coords.append([-1 * get_relative_hight_custom(value, neg_max_value), x_pos])
+                    coords.append([-1 * get_relative_hight_custom(value, shared_max_value), x_pos])
                 coords[-1][0] = 0
                 coords[0][0] = 0
                 write_to_file(draw_polygon(coords, opacity, fills[0], stroke_width))
@@ -778,7 +785,7 @@ def get_region_to_draw():
                 coords = []  # y, x
                 for x, value in enumerate(datafile):
                     x_pos = x_start + (x * quantile)
-                    coords.append([get_relative_hight_custom(value, pos_max_value), x_pos])
+                    coords.append([get_relative_hight_custom(value, shared_max_value), x_pos])
                 coords[-1][0] = 0
                 coords[0][0] = 0
                 write_to_file(draw_polygon(coords, opacity, fills[1], stroke_width))
@@ -857,8 +864,8 @@ def get_region_to_draw():
                         write_to_file(draw_polygon(coords, 0.8, spark_color[1], stroke_width_spark))
         else:
             print("Error: no input files for treatment and/or control")
-        # Draw y-axis for this group (sine) with independent labels
-        draw_sine_axis_for_group(y_start, pos_max_value, neg_max_value)
+        # Draw y-axis for this group (sine) with shared scale and symmetric labels
+        draw_sine_axis_for_group(y_start, shared_max_value)
 
 # Scalebar
 if display_scalebar == "yes":