From 7e34218cf8d9d5736bc4949518b6b98fbe3be0f5 Mon Sep 17 00:00:00 2001
From: Eric
Date: Tue, 1 Jul 2025 10:20:49 -0700
Subject: [PATCH 1/7] distribute scheduling

---
 .../detection_abstract.py                 | 69 +++++++++++++++++++
 .../templates/savedsearches_detections.j2 |  6 +-
 2 files changed, 72 insertions(+), 3 deletions(-)

diff --git a/contentctl/objects/abstract_security_content_objects/detection_abstract.py b/contentctl/objects/abstract_security_content_objects/detection_abstract.py
index 81e8f737..aebe7c64 100644
--- a/contentctl/objects/abstract_security_content_objects/detection_abstract.py
+++ b/contentctl/objects/abstract_security_content_objects/detection_abstract.py
@@ -57,6 +57,11 @@
 # Those AnalyticsTypes that we do not test via contentctl
 SKIPPED_ANALYTICS_TYPES: set[str] = {AnalyticsType.Correlation}
 
+import random
+
+GLOBAL_COUNTER = 0
+random.seed(42)  # For reproducibility in tests
+
 
 class Detection_Abstract(SecurityContentObject):
     name: str = Field(..., max_length=CONTENTCTL_MAX_SEARCH_NAME_LENGTH)
@@ -70,6 +75,70 @@ class Detection_Abstract(SecurityContentObject):
     known_false_positives: str = Field(..., min_length=4)
     rba: Optional[RBAObject] = Field(default=None)
 
+    @computed_field
+    @property
+    def statistically_disabled(self) -> str:
+        """
+        Returns a string that indicates whether the detection is statistically disabled.
+        This is used to determine whether, in test app builds intended for
+        performance testing, this detection should be enabled by default or not.
+        """
+        # Draw a random integer from 0-99, letting us set the probability of this
+        # search being enabled anywhere between 0 and 100 percent.
+
+        PERCENT_OF_SEARCHES_TO_ENABLE = 10
+        # Remember, the name of this field is "disabled", so "false" means the search
+        # should be enabled and "true" means disabled. It feels a bit backwards.
+        if random.randint(0, 99) < PERCENT_OF_SEARCHES_TO_ENABLE:
+            return "false"
+        else:
+            return "true"
+
+    @computed_field
+    @property
+    def calculated_cron(self) -> str:
+        """
+        Returns the cron expression for the detection.
+        Read the docs here for a better understanding of which cron
+        expressions are skewable (and good or bad candidates for skewing):
+        https://docs.splunk.com/Documentation/SplunkCloud/latest/Report/Skewscheduledreportstarttimes#How_the_search_schedule_affects_the_potential_schedule_offset
+        """
+        global GLOBAL_COUNTER
+        """
+        # Convert the UUID, which is unique per detection, to an integer.
+        uuid_as_int = int(self.id)
+        name_hash = hash(self.name)
+
+        # Then, mod this by 60. This should give us a fairly random distribution from 0-59.
+        MIN_TIME = 0
+        MAX_TIME = 59
+        TIME_DIFF = (MAX_TIME + 1) - MIN_TIME
+
+        # We do this instead of simply using randrange or similar because using the UUID makes
+        # generation of the cron schedule deterministic, which is useful for testing different
+        # windows. For example, there is a good chance we may get another request not to have
+        # things start within the first 5 minutes, given that many other searches are scheduled
+        # in ES to kick off at that time.
+        new_start_minute = name_hash % TIME_DIFF
+
+        # Every cron schedule for an ESCU search is 0 * * * *, so we will just substitute what
+        # we generated above, ignoring what is actually in the deployment.
+        """
+        # The spacing of the above implementation winds up being quite poor, maybe because
+        # our sample size is too small to approach a uniform distribution.
+        # So just use an int and mod it.
+        MIN_TIME = 0
+        MAX_TIME = 59
+        TIME_DIFF = (MAX_TIME + 1) - MIN_TIME
+        new_start_minute = GLOBAL_COUNTER % TIME_DIFF
+        GLOBAL_COUNTER = GLOBAL_COUNTER + 1
+
+        # return "0 * * * *"
+        return f"{new_start_minute} * * * *"
+
     @computed_field
     @property
     def risk_score(self) -> RiskScoreValue_Type:

diff --git a/contentctl/output/templates/savedsearches_detections.j2 b/contentctl/output/templates/savedsearches_detections.j2
index d1ef66b9..d2c0537c 100644
--- a/contentctl/output/templates/savedsearches_detections.j2
+++ b/contentctl/output/templates/savedsearches_detections.j2
@@ -31,7 +31,7 @@ action.risk.param._risk = {{ detection.risk | tojson }}
 action.risk.param._risk_score = 0
 action.risk.param.verbose = 0
 {% endif %}
-cron_schedule = {{ detection.deployment.scheduling.cron_schedule }}
+cron_schedule = {{ detection.calculated_cron }}
 dispatch.earliest_time = {{ detection.deployment.scheduling.earliest_time }}
 dispatch.latest_time = {{ detection.deployment.scheduling.latest_time }}
 action.correlationsearch.enabled = 1
@@ -70,7 +70,7 @@ action.sendtophantom.param.sensitivity = {{ detection.deployment.alert_action.ph
 action.sendtophantom.param.severity = {{ detection.deployment.alert_action.phantom.severity | custom_jinja2_enrichment_filter(detection) }}
 {% endif %}
 alert.digest_mode = 1
-disabled = {{ (not detection.enabled_by_default) | lower }}
+disabled = {{ detection.statistically_disabled }}
 enableSched = 1
 allow_skew = 100%
 counttype = number of events
@@ -80,7 +80,7 @@ realtime_schedule = 0
 is_visible = false
 {% if detection.tags.throttling %}
 alert.suppress = true
-alert.suppress.fields = {{ detection.tags.throttling.conf_formatted_fields() }}
+alert.suppress.fields = {{ detection.tags.throttling.conf_formatted_fields }}
 alert.suppress.period = {{ detection.tags.throttling.period }}
 {% endif %}
 search = {{ detection.search | escapeNewlines() }}
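The two computed fields added in PATCH 1 can be exercised standalone. The following sketch uses stand-in names rather than the real contentctl classes: a seeded RNG decides the enabled/disabled flag, and a module-level counter spreads start minutes round-robin over 0-59.

import random

random.seed(42)  # same seed as the patch, so every build gets the same draws
GLOBAL_COUNTER = 0
PERCENT_OF_SEARCHES_TO_ENABLE = 10

def statistically_disabled() -> str:
    # "false" means enabled; the conf key being rendered is `disabled`.
    return "false" if random.randint(0, 99) < PERCENT_OF_SEARCHES_TO_ENABLE else "true"

def calculated_cron() -> str:
    global GLOBAL_COUNTER
    minute = GLOBAL_COUNTER % 60  # round-robin over minutes 0-59
    GLOBAL_COUNTER += 1
    return f"{minute} * * * *"

for _ in range(3):
    print(statistically_disabled(), calculated_cron())

Note the tradeoff: seeding makes the enabled subset reproducible per build, but which detections land in it still depends on the order they are processed, unlike the UUID-hash approach described in the commented-out block.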
From c04b5d40b3ff5eff66d046f5d10b050ef5f2e7ba Mon Sep 17 00:00:00 2001
From: Eric
Date: Tue, 1 Jul 2025 16:22:47 -0700
Subject: [PATCH 2/7] Alert suppression automatically derived from RBA
 risk_object and threat_objects fields, with a period of 86400s (24 hours).
 No alert_groups are configured. Experimental: content whose RBA fields do
 not appear in the detection SPL generates warnings, not errors.

---
 .../detection_abstract.py                |  41 +++++++++++--
 contentctl/objects/baseline.py           |  57 +++++++++++++++++++
 contentctl/objects/throttling.py         |   5 +-
 .../templates/savedsearches_baselines.j2 |   2 +-
 4 files changed, 97 insertions(+), 8 deletions(-)

diff --git a/contentctl/objects/abstract_security_content_objects/detection_abstract.py b/contentctl/objects/abstract_security_content_objects/detection_abstract.py
index aebe7c64..a96c3d31 100644
--- a/contentctl/objects/abstract_security_content_objects/detection_abstract.py
+++ b/contentctl/objects/abstract_security_content_objects/detection_abstract.py
@@ -52,6 +52,7 @@
 from contentctl.objects.rba import RBAObject, RiskScoreValue_Type
 from contentctl.objects.security_content_object import SecurityContentObject
 from contentctl.objects.test_group import TestGroup
+from contentctl.objects.throttling import Throttling
 from contentctl.objects.unit_test import UnitTest
 
 # Those AnalyticsTypes that we do not test via contentctl
@@ -127,17 +128,27 @@ def calculated_cron(self) -> str:
         # Every cron schedule for an ESCU search is 0 * * * *, so we will just substitute what
         # we generated above, ignoring what is actually in the deployment.
         """
+
         # The spacing of the above implementation winds up being quite poor, maybe because
         # our sample size is too small to approach a uniform distribution.
         # So just use an int and mod it.
         MIN_TIME = 0
-        MAX_TIME = 59
+        MAX_TIME = 14
         TIME_DIFF = (MAX_TIME + 1) - MIN_TIME
         new_start_minute = GLOBAL_COUNTER % TIME_DIFF
         GLOBAL_COUNTER = GLOBAL_COUNTER + 1
 
+        if self.type is AnalyticsType.TTP:
+            minute_start = new_start_minute % 15
+            minute_stop = minute_start + 45
+
+            return self.deployment.scheduling.cron_schedule.format(
+                minute_range=f"{minute_start}-{minute_stop}"
+            )
+
         # return "0 * * * *"
-        return f"{new_start_minute} * * * *"
+
+        return self.deployment.scheduling.cron_schedule.format(minute=new_start_minute)
 
     @computed_field
     @property
     def risk_score(self) -> RiskScoreValue_Type:
@@ -873,22 +884,40 @@ def addTags_nist(self):
         return self
 
     @model_validator(mode="after")
-    def ensureThrottlingFieldsExist(self):
+    def automaticallyCreateThrottling(self, default_throttling_period: str = "86400s"):
         """
+        If throttling is not explicitly configured, then automatically create
+        it from the risk and threat objects defined in the RBA config.
+
         For throttling to work properly, the fields to throttle on MUST
         exist in the search itself. If not, then we cannot apply the throttling.
         """
         if self.tags.throttling is None:
             # No throttling configured for this detection
-            return self
+
+            # Automatically add throttling fields based on the risk and threat objects
+            if self.rba is None:
+                # Cannot add any throttling because there is no RBA config
+                return self
+
+            self.tags.throttling = Throttling(
+                fields=[ro.field for ro in self.rba.risk_objects]  # type: ignore
+                + [to.field for to in self.rba.threat_objects],  # type: ignore
+                period=default_throttling_period,  # provide a default period of 1 day
+            )
 
         missing_fields: list[str] = [
             field for field in self.tags.throttling.fields if field not in self.search
         ]
         if len(missing_fields) > 0:
-            raise ValueError(
-                f"The following throttle fields were missing from the search: {missing_fields}"
+            print(
+                f"\nThe following throttle fields were missing from the search [{self.name}]. "
+                f"This is just a warning for now since this is an experimental feature: {missing_fields}\n"
             )
+            return self
+            # raise ValueError(
+            #     f"The following throttle fields were missing from the search [{self.name}]: {missing_fields}"
+            # )
         else:
             # All throttling fields present in search
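The derivation in automaticallyCreateThrottling above can be summarized in a few lines. This sketch uses hypothetical stand-in types, not the real pydantic models: when no throttling is configured, suppress on every RBA risk and threat field, and only warn when a field is absent from the SPL.

from dataclasses import dataclass

@dataclass
class Throttling:
    fields: list[str]
    period: str = "86400s"

@dataclass
class RBA:
    risk_objects: list[str]
    threat_objects: list[str]

def derive_throttling(rba: RBA | None, search: str) -> Throttling | None:
    if rba is None:
        return None  # nothing to derive from
    throttling = Throttling(fields=rba.risk_objects + rba.threat_objects)
    missing = [f for f in throttling.fields if f not in search]
    if missing:
        # Experimental behavior, matching the validator: warn instead of raising.
        print(f"Warning: throttle fields missing from the search: {missing}")
    return throttling

# derive_throttling(RBA(["user", "dest"], ["process_name"]), "... | stats count by user, dest")
# warns that process_name is absent, but still returns the Throttling object.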
diff --git a/contentctl/objects/baseline.py b/contentctl/objects/baseline.py
index d5ed5520..eec73ab6 100644
--- a/contentctl/objects/baseline.py
+++ b/contentctl/objects/baseline.py
@@ -15,6 +15,9 @@
     model_serializer,
 )
 
+from contentctl.objects.abstract_security_content_objects.detection_abstract import (
+    GLOBAL_COUNTER,
+)
 from contentctl.objects.baseline_tags import BaselineTags
 from contentctl.objects.config import CustomApp
 from contentctl.objects.constants import (
@@ -39,6 +42,60 @@ class Baseline(SecurityContentObject):
     deployment: Deployment = Field({})
     status: ContentStatus
 
+    @computed_field
+    @property
+    def calculated_cron(self) -> str:
+        """
+        Returns the cron expression for the baseline.
+        Read the docs here for a better understanding of which cron
+        expressions are skewable (and good or bad candidates for skewing):
+        https://docs.splunk.com/Documentation/SplunkCloud/latest/Report/Skewscheduledreportstarttimes#How_the_search_schedule_affects_the_potential_schedule_offset
+        """
+        global GLOBAL_COUNTER
+        """
+        # Convert the UUID, which is unique per detection, to an integer.
+        uuid_as_int = int(self.id)
+        name_hash = hash(self.name)
+
+        # Then, mod this by 60. This should give us a fairly random distribution from 0-59.
+        MIN_TIME = 0
+        MAX_TIME = 59
+        TIME_DIFF = (MAX_TIME + 1) - MIN_TIME
+
+        # We do this instead of simply using randrange or similar because using the UUID makes
+        # generation of the cron schedule deterministic, which is useful for testing different
+        # windows. For example, there is a good chance we may get another request not to have
+        # things start within the first 5 minutes, given that many other searches are scheduled
+        # in ES to kick off at that time.
+        new_start_minute = name_hash % TIME_DIFF
+
+        # Every cron schedule for an ESCU search is 0 * * * *, so we will just substitute what
+        # we generated above, ignoring what is actually in the deployment.
+        """
+
+        # The spacing of the above implementation winds up being quite poor, maybe because
+        # our sample size is too small to approach a uniform distribution.
+        # So just use an int and mod it.
+        MIN_TIME = 0
+        MAX_TIME = 14
+        TIME_DIFF = (MAX_TIME + 1) - MIN_TIME
+        new_start_minute = GLOBAL_COUNTER % TIME_DIFF
+        GLOBAL_COUNTER = GLOBAL_COUNTER + 1
+
+        new_start_minute = GLOBAL_COUNTER % TIME_DIFF
+        GLOBAL_COUNTER = GLOBAL_COUNTER + 1
+
+        try:
+            return self.deployment.scheduling.cron_schedule.format(
+                minute=new_start_minute
+            )
+        except Exception as e:
+            print(e)
+            import code
+
+            code.interact(local=locals())
+
     @field_validator("status", mode="after")
     @classmethod
     def NarrowStatus(cls, status: ContentStatus) -> ContentStatus:

diff --git a/contentctl/objects/throttling.py b/contentctl/objects/throttling.py
index de6f9cd9..674ae79a 100644
--- a/contentctl/objects/throttling.py
+++ b/contentctl/objects/throttling.py
@@ -1,6 +1,7 @@
-from pydantic import BaseModel, Field, field_validator
 from typing import Annotated
 
+from pydantic import BaseModel, Field, computed_field, field_validator
+
 # Alert Suppression/Throttling settings have been taken from
 # https://docs.splunk.com/Documentation/Splunk/9.2.2/Admin/Savedsearchesconf
@@ -28,6 +29,8 @@ def no_spaces_in_fields(cls, v: list[str]) -> list[str]:
             )
         return v
 
+    @computed_field
+    @property
     def conf_formatted_fields(self) -> str:
         """
         TODO:
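The computed_field change above is what lets the savedsearches template (updated in PATCH 1) reference conf_formatted_fields as an attribute rather than calling it. A minimal sketch of that pattern, with an assumed comma-join body since the real method's formatting is elided behind a TODO:

from pydantic import BaseModel, computed_field

class Throttling(BaseModel):
    fields: list[str]
    period: str = "86400s"

    @computed_field
    @property
    def conf_formatted_fields(self) -> str:
        # savedsearches.conf wants a single field-list string; the exact
        # delimiter contentctl uses is an assumption here.
        return ",".join(self.fields)

t = Throttling(fields=["user", "dest"])
print(t.conf_formatted_fields)  # user,dest -- attribute access, no call
print(t.model_dump())           # computed fields are also serialized by pydantic v2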
diff --git a/contentctl/output/templates/savedsearches_baselines.j2 b/contentctl/output/templates/savedsearches_baselines.j2
index 28e8a31b..378b9a0f 100644
--- a/contentctl/output/templates/savedsearches_baselines.j2
+++ b/contentctl/output/templates/savedsearches_baselines.j2
@@ -17,7 +17,7 @@ action.escu.analytic_story = {{ objectListToNameList(detection.tags.analytic_sto
 action.escu.analytic_story = []
 {% endif %}
 action.escu.data_models = {{ detection.datamodel | tojson }}
-cron_schedule = {{ detection.deployment.scheduling.cron_schedule }}
+cron_schedule = {{ detection.calculated_cron }}
 enableSched = 1
 dispatch.earliest_time = {{ detection.deployment.scheduling.earliest_time }}
 dispatch.latest_time = {{ detection.deployment.scheduling.latest_time }}
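PATCH 2 also switches calculated_cron from emitting a literal cron string to calling .format() on the deployment's cron_schedule, which implies that field is now a template string with named placeholders. The template values below are assumptions for illustration, not the shipped deployment configs:

ttp_template = "{minute_range}/15 * * * *"  # assumed TTP template: every 15 minutes
hourly_template = "{minute} * * * *"        # assumed default template: hourly

print(hourly_template.format(minute=7))          # "7 * * * *"
print(ttp_template.format(minute_range="3-48"))  # "3-48/15 * * * *"

Under that assumption, "3-48/15" fires at minutes 3, 18, 33, and 48, i.e. every 15 minutes with a 3-minute offset, which would explain why minute_stop is computed as minute_start + 45.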
From 8d62bd9c6c69f5622281d48a1a601830432417c0 Mon Sep 17 00:00:00 2001
From: Eric
Date: Tue, 1 Jul 2025 16:24:30 -0700
Subject: [PATCH 3/7] no searches enabled by default

---
 .../abstract_security_content_objects/detection_abstract.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/contentctl/objects/abstract_security_content_objects/detection_abstract.py b/contentctl/objects/abstract_security_content_objects/detection_abstract.py
index a96c3d31..993fef6f 100644
--- a/contentctl/objects/abstract_security_content_objects/detection_abstract.py
+++ b/contentctl/objects/abstract_security_content_objects/detection_abstract.py
@@ -89,7 +89,7 @@ def statistically_disabled(self) -> str:
         # Draw a random integer from 0-99, letting us set the probability of this
         # search being enabled anywhere between 0 and 100 percent.
 
-        PERCENT_OF_SEARCHES_TO_ENABLE = 10
+        PERCENT_OF_SEARCHES_TO_ENABLE = 0
         # Remember, the name of this field is "disabled", so "false" means the search
         # should be enabled and "true" means disabled. It feels a bit backwards.
         if random.randint(0, 99) < PERCENT_OF_SEARCHES_TO_ENABLE:
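With the threshold at 0, the gate above can never pass: random.randint(0, 99) is always >= 0, so every detection renders with disabled = true regardless of the seed. A one-line check:

import random

random.seed(42)
assert all(not (random.randint(0, 99) < 0) for _ in range(10_000))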
From 4f4c9e2122198e056baaee49dd90795ea746a1f2 Mon Sep 17 00:00:00 2001
From: Eric
Date: Tue, 1 Jul 2025 16:27:45 -0700
Subject: [PATCH 4/7] move import

---
 .../abstract_security_content_objects/detection_abstract.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/contentctl/objects/abstract_security_content_objects/detection_abstract.py b/contentctl/objects/abstract_security_content_objects/detection_abstract.py
index 993fef6f..5189af0c 100644
--- a/contentctl/objects/abstract_security_content_objects/detection_abstract.py
+++ b/contentctl/objects/abstract_security_content_objects/detection_abstract.py
@@ -25,6 +25,7 @@
 from contentctl.objects.config import CustomApp
 
 import datetime
+import random
 from functools import cached_property
 
 from contentctl.enrichments.cve_enrichment import CveEnrichmentObj
@@ -58,7 +59,6 @@
 # Those AnalyticsTypes that we do not test via contentctl
 SKIPPED_ANALYTICS_TYPES: set[str] = {AnalyticsType.Correlation}
 
-import random
 
 GLOBAL_COUNTER = 0
 random.seed(42)  # For reproducibility in tests

From b13f824be38673631f2b5953d525e2f547a7da28 Mon Sep 17 00:00:00 2001
From: Eric
Date: Tue, 1 Jul 2025 16:39:50 -0700
Subject: [PATCH 5/7] fix baseline interval

---
 contentctl/objects/baseline.py | 3 ---
 1 file changed, 3 deletions(-)

diff --git a/contentctl/objects/baseline.py b/contentctl/objects/baseline.py
index eec73ab6..70f59812 100644
--- a/contentctl/objects/baseline.py
+++ b/contentctl/objects/baseline.py
@@ -83,9 +83,6 @@ def calculated_cron(self) -> str:
         new_start_minute = GLOBAL_COUNTER % TIME_DIFF
         GLOBAL_COUNTER = GLOBAL_COUNTER + 1
 
-        new_start_minute = GLOBAL_COUNTER % TIME_DIFF
-        GLOBAL_COUNTER = GLOBAL_COUNTER + 1
-
         try:
             return self.deployment.scheduling.cron_schedule.format(
                 minute=new_start_minute
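Why the duplicated block removed in PATCH 5 mattered: each baseline consumed two counter ticks but only the second value was used, so baselines occupied every other slot (1, 3, 5, ...) instead of every slot (0, 1, 2, ...). A small demonstration of the buggy behavior:

TIME_DIFF = 15

def buggy(counter: int) -> tuple[int, int]:
    minute = counter % TIME_DIFF; counter += 1  # first computation, discarded
    minute = counter % TIME_DIFF; counter += 1  # second computation, kept
    return minute, counter

counter = 0
minutes = []
for _ in range(5):
    minute, counter = buggy(counter)
    minutes.append(minute)
print(minutes)  # [1, 3, 5, 7, 9] -- half the available slots are never used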
From e1c0bd70177d6db87a544ebb75d978d02ab0f007 Mon Sep 17 00:00:00 2001
From: Eric
Date: Thu, 17 Jul 2025 15:57:49 -0700
Subject: [PATCH 6/7] Don't change start minutes; do apply throttling where
 applicable

---
 .../detection_abstract.py | 72 +++++++++++++++----
 1 file changed, 58 insertions(+), 14 deletions(-)

diff --git a/contentctl/objects/abstract_security_content_objects/detection_abstract.py b/contentctl/objects/abstract_security_content_objects/detection_abstract.py
index 5189af0c..97c3497b 100644
--- a/contentctl/objects/abstract_security_content_objects/detection_abstract.py
+++ b/contentctl/objects/abstract_security_content_objects/detection_abstract.py
@@ -2,6 +2,7 @@
 
 import pathlib
 import re
+import sys
 from enum import StrEnum
 from typing import TYPE_CHECKING, Annotated, Any, List, Optional, Union
@@ -59,8 +60,40 @@
 # Those AnalyticsTypes that we do not test via contentctl
 SKIPPED_ANALYTICS_TYPES: set[str] = {AnalyticsType.Correlation}
 
+import questionary
+
+try:
+    PERCENTAGE_OF_SEARCHES_TO_ENABLE_BY_DEFAULT = int(
+        questionary.text(
+            "Enter the percentage of searches (as a whole number integer) you want to enable by default",
+            default="0",
+        ).ask()
+    )
+
+    EXACT_START_MINUTE: bool = questionary.confirm(
+        "Shall we assign an EXACT start minute for each detection? \n'Yes' "
+        "will assign an exact start minute, while 'No' will assign a "
+        "minute of '0' and result in maximal skew"
+    ).ask()
+
+    if EXACT_START_MINUTE:
+        DETERMINISTIC_START_TIMES: bool = questionary.confirm(
+            "Shall we deterministically spread detection start times between 0-59 minutes, "
+            "with their start times the same between different builds? \nChoosing 'Yes' will "
+            "mean that some minutes have more searches scheduled than other minutes.\n"
+            "Choosing 'No' will mean that the start time for a specific search can change from build to build"
+        ).ask()
+    else:
+        # If we are not starting at an exact minute, then we will always start
+        # at minute 0, which leaves the actual start time ambiguous, as the
+        # decision is made by the Splunk scheduler.
+        DETERMINISTIC_START_TIMES: bool = False
+
+
+except Exception as e:
+    print(f"Issue getting answers for the build. Quitting... \n{str(e)}")
+    sys.exit(1)
+
-GLOBAL_COUNTER = 0
+GLOBAL_COUNTER = -1
 random.seed(42)  # For reproducibility in tests
@@ -89,10 +122,9 @@ def statistically_disabled(self) -> str:
         # Draw a random integer from 0-99, letting us set the probability of this
         # search being enabled anywhere between 0 and 100 percent.
 
-        PERCENT_OF_SEARCHES_TO_ENABLE = 0
         # Remember, the name of this field is "disabled", so "false" means the search
         # should be enabled and "true" means disabled. It feels a bit backwards.
-        if random.randint(0, 99) < PERCENT_OF_SEARCHES_TO_ENABLE:
+        if random.randint(0, 99) < PERCENTAGE_OF_SEARCHES_TO_ENABLE_BY_DEFAULT:
             return "false"
         else:
             return "true"
@@ -128,27 +160,39 @@ def calculated_cron(self) -> str:
         # Every cron schedule for an ESCU search is 0 * * * *, so we will just substitute what
         # we generated above, ignoring what is actually in the deployment.
         """
+        GLOBAL_COUNTER += 1
+        if not EXACT_START_MINUTE:
+            if self.type is AnalyticsType.TTP:
+                return self.deployment.scheduling.cron_schedule.format(minute="*")
+            else:
+                return self.deployment.scheduling.cron_schedule.format(minute="0")
+
+        if DETERMINISTIC_START_TIMES:
+            uuid_as_int = int(self.id)
+            if self.type is AnalyticsType.TTP:
+                # TTP searches run every 15 minutes, so mod this by 15
+                start_minute = uuid_as_int % 15
+            else:
+                start_minute = uuid_as_int % 60
 
         # The spacing of the above implementation winds up being quite poor, maybe because
         # our sample size is too small to approach a uniform distribution.
         # So just use an int and mod it.
-        MIN_TIME = 0
-        MAX_TIME = 14
-        TIME_DIFF = (MAX_TIME + 1) - MIN_TIME
-        new_start_minute = GLOBAL_COUNTER % TIME_DIFF
-        GLOBAL_COUNTER = GLOBAL_COUNTER + 1
+
+        # Try our best to spread these as evenly as possible
+        #
 
         if self.type is AnalyticsType.TTP:
-            minute_start = new_start_minute % 15
+            minute_start = GLOBAL_COUNTER % 15
             minute_stop = minute_start + 45
 
             return self.deployment.scheduling.cron_schedule.format(
                 minute_range=f"{minute_start}-{minute_stop}"
             )
 
-        # return "0 * * * *"
-
-        return self.deployment.scheduling.cron_schedule.format(minute=new_start_minute)
+        return self.deployment.scheduling.cron_schedule.format(
+            minute=GLOBAL_COUNTER % 60
+        )
@@ -884,7 +928,7 @@ def addTags_nist(self):
         return self
 
     @model_validator(mode="after")
-    def automaticallyCreateThrottling(self, default_throttling_period: str = "86400s"):
+    def automaticallyCreateThrottling(self, default_throttling_period: str = "3600s"):
         """
         If throttling is not explicitly configured, then automatically create
         it from the risk and threat objects defined in the RBA config.
@@ -904,7 +948,7 @@ def automaticallyCreateThrottling(self, default_throttling_period: str = "86400s
             self.tags.throttling = Throttling(
                 fields=[ro.field for ro in self.rba.risk_objects]  # type: ignore
                 + [to.field for to in self.rba.threat_objects],  # type: ignore
-                period=default_throttling_period,  # provide a default period of 1 day
+                period=default_throttling_period,  # provide a default period in line with the argument to this function
             )
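The interactive gate added at the top of PATCH 6 can be tried standalone. questionary.text() returns a string (or None if the prompt is aborted), so the int() cast and the surrounding try/except are what turn a bad answer into a clean exit:

import sys

import questionary

try:
    percent = int(
        questionary.text("Percent of searches to enable by default", default="0").ask()
    )
    exact = questionary.confirm("Assign an exact start minute?").ask()
except Exception as e:
    print(f"Issue getting answers for the build. Quitting...\n{e}")
    sys.exit(1)

print(f"enable {percent}% of searches; exact start minute: {exact}")

One consequence of the patch placing this at module scope is that any import of detection_abstract.py, including by non-interactive tooling, now blocks on these prompts.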
From a4236df9878d5a2e1dc96a8431d71601bcaee8bc Mon Sep 17 00:00:00 2001
From: Eric
Date: Thu, 17 Jul 2025 16:29:52 -0700
Subject: [PATCH 7/7] another update that prevents distributing searches for
 now

---
 .../detection_abstract.py      |  5 ++-
 contentctl/objects/baseline.py | 37 +++++++++++++------
 2 files changed, 30 insertions(+), 12 deletions(-)

diff --git a/contentctl/objects/abstract_security_content_objects/detection_abstract.py b/contentctl/objects/abstract_security_content_objects/detection_abstract.py
index 97c3497b..ae0db76b 100644
--- a/contentctl/objects/abstract_security_content_objects/detection_abstract.py
+++ b/contentctl/objects/abstract_security_content_objects/detection_abstract.py
@@ -160,14 +160,17 @@ def calculated_cron(self) -> str:
         # Every cron schedule for an ESCU search is 0 * * * *, so we will just substitute what
         # we generated above, ignoring what is actually in the deployment.
         """
+
         GLOBAL_COUNTER += 1
         if not EXACT_START_MINUTE:
             if self.type is AnalyticsType.TTP:
                 return self.deployment.scheduling.cron_schedule.format(minute="*")
             else:
                 return self.deployment.scheduling.cron_schedule.format(minute="0")
-
+        print("\nEXACT START MINUTE IS NOT SUPPORTED ANYMORE.\n")
+        sys.exit(1)
         if DETERMINISTIC_START_TIMES:
+            sys.exit(1)
             uuid_as_int = int(self.id)
             if self.type is AnalyticsType.TTP:
                 # TTP searches run every 15 minutes, so mod this by 15
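One subtlety in how baseline.py shares GLOBAL_COUNTER with detection_abstract.py: "from m import NAME" copies the binding, so rebinding the name in the importing module does not advance the counter the source module sees, and the two files end up counting independently. A tiny demonstration:

import types

m = types.ModuleType("m")
m.GLOBAL_COUNTER = 0

# Simulates "from m import GLOBAL_COUNTER" followed by "GLOBAL_COUNTER += 1"
GLOBAL_COUNTER = m.GLOBAL_COUNTER
GLOBAL_COUNTER += 1

print(GLOBAL_COUNTER)    # 1 -- the local copy advanced
print(m.GLOBAL_COUNTER)  # 0 -- the source module's counter did not

Mutating through the module attribute instead (m.GLOBAL_COUNTER += 1) would keep both files counting against the same value.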
diff --git a/contentctl/objects/baseline.py b/contentctl/objects/baseline.py
index 70f59812..9e367921 100644
--- a/contentctl/objects/baseline.py
+++ b/contentctl/objects/baseline.py
@@ -16,6 +16,8 @@
 )
 
 from contentctl.objects.abstract_security_content_objects.detection_abstract import (
+    DETERMINISTIC_START_TIMES,
+    EXACT_START_MINUTE,
     GLOBAL_COUNTER,
 )
 from contentctl.objects.baseline_tags import BaselineTags
@@ -74,24 +76,37 @@ def calculated_cron(self) -> str:
         # we generated above, ignoring what is actually in the deployment.
         """
 
+        GLOBAL_COUNTER += 1
+        if not EXACT_START_MINUTE:
+            return self.deployment.scheduling.cron_schedule.format(minute="0")
+
+        print("\nEXACT START MINUTE IS NOT SUPPORTED ANYMORE.\n")
+        import sys
+
+        sys.exit(1)
+
+        if DETERMINISTIC_START_TIMES:
+            sys.exit(1)
+            uuid_as_int = int(self.id)
+            start_minute = uuid_as_int % 60
+
         # The spacing of the above implementation winds up being quite poor, maybe because
         # our sample size is too small to approach a uniform distribution.
         # So just use an int and mod it.
-        MIN_TIME = 0
-        MAX_TIME = 14
-        TIME_DIFF = (MAX_TIME + 1) - MIN_TIME
-        new_start_minute = GLOBAL_COUNTER % TIME_DIFF
-        GLOBAL_COUNTER = GLOBAL_COUNTER + 1
 
-        try:
+        # Try our best to spread these as evenly as possible
+        #
+
+        if self.type is AnalyticsType.TTP:
+            minute_start = GLOBAL_COUNTER % 15
+            minute_stop = minute_start + 45
+
             return self.deployment.scheduling.cron_schedule.format(
-                minute=new_start_minute
+                minute_range=f"{minute_start}-{minute_stop}"
             )
-        except Exception as e:
-            print(e)
-            import code
-
-            code.interact(local=locals())
+
+        return self.deployment.scheduling.cron_schedule.format(
+            minute=GLOBAL_COUNTER % 60
+        )
 
     @field_validator("status", mode="after")
     @classmethod
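The recurring comment about the hash-based spacing being "quite poor" can be checked directly: hashing around 1500 names into 60 minute-buckets leaves some buckets far fuller than others, while a counter mod 60 is perfectly even. The names below are synthetic stand-ins for detection names:

from collections import Counter

N, BUCKETS = 1500, 60

hash_buckets = Counter(hash(f"detection_{i}") % BUCKETS for i in range(N))
counter_buckets = Counter(i % BUCKETS for i in range(N))

print("hash:    min", min(hash_buckets.values()), "max", max(hash_buckets.values()))
print("counter: min", min(counter_buckets.values()), "max", max(counter_buckets.values()))

Typical output shows hash buckets ranging from roughly 15 to 35 entries while every counter bucket holds exactly 25 (string hashes are also randomized per process unless PYTHONHASHSEED is pinned). That is the tradeoff the patch series keeps circling: the counter is perfectly even but order-dependent, while the hash is stable per name but lumpy at this sample size.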