Spaces:

abrown31
/

open-range

Runtime error

Aaron Brown committed on Mar 8

Commit

53ccc8a

1 Parent(s): 7fedc25

Fix difficulty calibration, deduplicate golden path, harden prompts

- TemplateOnlyBuilder: cap vuln count to fit tier step window (±20%),
deduplicate shared recon steps (e.g. nmap) across multi-vuln snapshots
- DifficultyCheck: use round() instead of int() for upper bound to avoid
off-by-one truncation
- Builder prompts: reframe language for authorized security training context
- CLI: add reward_grounding to Docker-required checks
- Environment: respect OPENRANGE_MOCK=1 env var for forced mock mode

Files changed (5) hide show

src/open_range/builder/builder.py +21 -3
src/open_range/builder/prompts.py +76 -60
src/open_range/cli.py +1 -1
src/open_range/server/environment.py +6 -1
src/open_range/validator/difficulty.py +1 -1

src/open_range/builder/builder.py CHANGED Viewed

@@ -949,10 +949,24 @@ class TemplateOnlyBuilder:
         if preferred:
             candidates = preferred
-        # Pick 1-2 vulns
         max_vulns = manifest.get("difficulty", {}).get("max_vulns", 2)
         min_vulns = manifest.get("difficulty", {}).get("min_vulns", 1)
-        count = rng.randint(min_vulns, min(max_vulns, len(candidates)))
         chosen = rng.sample(candidates, count)
         # Build topology from manifest
@@ -1017,11 +1031,15 @@ class TemplateOnlyBuilder:
                 )
             )
             for gs in v.get("golden_path_steps", []):
                 step_offset += 1
                 golden_path.append(
                     GoldenPathStep(
                         step=step_offset,
-                        command=gs["cmd"],
                         expect_in_stdout=gs["expect_stdout"],
                         description=gs.get("description", ""),
                     )

         if preferred:
             candidates = preferred
+        # Pick vulns, respecting tier step target.
+        # Each template vuln contributes ~5 golden path steps, so cap count
+        # to fit within the tier's ±20% step window.
+        from open_range.validator.difficulty import TIER_TARGETS, TOLERANCE
+        tier = int(manifest.get("tier", context.tier) or context.tier)
+        step_target = TIER_TARGETS.get(tier, 8)
+        max_steps_hi = int(step_target * (1 + TOLERANCE))
+        # Each vuln adds ~5 steps but the first nmap step is shared, so
+        # subsequent vulns add ~4 incremental steps.
+        avg_first = 5
+        avg_extra = 4
+        tier_max_vulns = max(1, 1 + (max_steps_hi - avg_first) // avg_extra)
         max_vulns = manifest.get("difficulty", {}).get("max_vulns", 2)
         min_vulns = manifest.get("difficulty", {}).get("min_vulns", 1)
+        effective_max = min(max_vulns, tier_max_vulns, len(candidates))
+        count = rng.randint(min_vulns, max(min_vulns, effective_max))
         chosen = rng.sample(candidates, count)
         # Build topology from manifest
                 )
             )
             for gs in v.get("golden_path_steps", []):
+                cmd = gs["cmd"]
+                # Deduplicate shared recon steps (e.g. nmap) across vulns
+                if any(s.command == cmd for s in golden_path):
+                    continue
                 step_offset += 1
                 golden_path.append(
                     GoldenPathStep(
                         step=step_offset,
+                        command=cmd,
                         expect_in_stdout=gs["expect_stdout"],
                         description=gs.get("description", ""),
                     )

src/open_range/builder/prompts.py CHANGED Viewed

@@ -1,10 +1,24 @@
 """System prompts for Builder LLM and Validator realism review."""
 BUILDER_SYSTEM_PROMPT = """\
-You are the OpenRange Builder. You generate **complete, working cybersecurity \
-range environments** as structured JSON. Your output is deployed to real Docker \
-containers where Red and Blue agents train. You must produce a full application \
-— not just vulnerability snippets — because the containers start empty.
 # What You Must Generate
@@ -14,21 +28,22 @@ The Docker containers have running processes (nginx, MySQL, Samba, etc.) but \
 1. **A complete web application** — multiple PHP pages (login, dashboard, \
 search/lookup, forms, API endpoints) that look like real business software. \
-The vulnerable code is woven naturally into this app. Include normal pages \
-alongside vulnerable ones so the agent must discover which endpoints are weak.
 2. **Database seed data** — SQL to populate users (with passwords), realistic \
 business records (patients, orders, employees — whatever matches the company), \
-and flags hidden in the data. Use the existing table schemas.
 3. **File share content** — documents, config files, spreadsheets, or notes \
 placed in Samba share directories. Some may contain credentials or clues.
 4. **Config files** — any nginx configs, cron jobs, backup scripts, or PHP \
-configs that are part of the attack surface.
 The result must feel like a real company's IT system that has been running for \
-months — not an empty CTF sandbox.
 # Docker Infrastructure Context
@@ -37,10 +52,10 @@ months — not an empty CTF sandbox.
 - **dmz** (10.0.1.0/24): web=10.0.1.10, mail=10.0.1.11, firewall=10.0.1.2
 - **internal** (10.0.2.0/24): db=10.0.2.20, files=10.0.2.21, firewall=10.0.2.2
 - **management** (10.0.3.0/24): ldap=10.0.3.20, siem=10.0.3.21, firewall=10.0.3.2
-- Attacker reaches DMZ via firewall NAT. Attacker can scan DMZ (10.0.1.0/24) \
-and will discover web at 10.0.1.10 and mail at 10.0.1.11.
-- **Golden path commands from attacker use IPs** (10.0.1.10 for web, etc.) \
-because the attacker is on a different network and cannot resolve hostnames.
 - **PHP code inside web container uses hostnames** (`db`, `ldap`) because \
 web is on the same Docker networks as those services.
@@ -77,13 +92,14 @@ for flags or hidden pages
 - Admin: `cn=admin,dc=meridianhealth,dc=local` / `LdapAdm1n!`
 - Ports: **389**, **636**
-**attacker** (Kali Linux, 10.0.0.10):
 - Tools: nmap, sqlmap, hydra, smbclient, nikto, curl, wget, ssh, nc, \
 python3, tcpdump
-- Attacker uses **IPs not hostnames**: `curl http://10.0.1.10/` not `http://web/`
-- mysql from attacker: `mysql -h 10.0.2.20 -u user -ppassword` (if reachable)
 - No gobuster, no burpsuite, no metasploit, no mysql-client (use python3 or \
-route through web vuln for DB access).
 # Output Format
@@ -107,13 +123,13 @@ Return ONLY valid JSON (no markdown fences, no prose):
         "service": "<service_name>",
         "injection_point": "<URL path or credential>",
         "vulnerable_code": "<code snippet or {file_path: snippet}>",
-        "root_cause": "<why it is vulnerable — tie to company context>",
-        "blast_radius": "<what an attacker gains>",
         "remediation": "<how to fix>"
       }
     ],
     "exploit_chain": [
-      {"vuln_id": "<id>", "command": "<technique>", "description": "<what attacker gains>"}
     ]
   },
   "files": {
@@ -140,8 +156,8 @@ Return ONLY valid JSON (no markdown fences, no prose):
     }
   ],
   "task": {
-    "red_briefing": "<what Red sees — NO flag values, NO vuln types, NO exploit details>",
-    "blue_briefing": "<what Blue sees — generic monitoring instructions>"
   }
 }
@@ -158,7 +174,7 @@ transaction search, reports.
 Requirements:
 - `index.php` — landing/login page with HTML form
 - At least 3-5 additional PHP pages (dashboard, search, forms, API)
-- Some pages are safe, some contain the planted vulnerabilities
 - All PHP files that access DB use inline: \
 `$conn = new mysqli('db', 'app_user', 'AppUs3r!2024', 'referral_db');`
 - Pages should output realistic HTML (not just raw JSON)
@@ -172,7 +188,7 @@ username, password in plaintext or MD5, email, role, department)
 - INSERT realistic business records (10-20 rows of patients, referrals, \
 billing, etc.)
 - INSERT flags into `flags.secrets` (flag_name, flag)
-- Any additional tables or data the vulns require
 - GRANT statements for any service accounts
 ## File Share Content (`files:/srv/shares/...`)
@@ -191,27 +207,27 @@ At least 3-5 files total. Some can contain credentials or flag clues.
 # Core Rules
 1. **Topology must match the manifest.** Use only declared hosts and zones.
-2. **Vary vulns.** Avoid runtime_context.previous_vuln_classes.
-3. **Never leak flags in briefings.** No flag values, no vuln types, no \
-exploit details in red_briefing or blue_briefing.
 4. **Flags are random.** Unique FLAG{...} with random hex. Never reuse.
-5. **Exploit chains are logical.** Each step yields what the next step needs.
 6. **Evidence in monitored locations only.** Check monitoring_coverage.logged \
 vs blind_spots.
-7. **Target weak areas.** Prefer runtime_context.weak_areas vuln types.
 8. **Golden path step count matches tier.** T1~8, T2~15, T3~25. ±20%.
 # Realism Rules
-9. **Root causes from the company story.** Tie every vuln to the company's \
 industry, staffing, tech debt, or recent incidents.
-10. **Version-appropriate vulns.** Match tech_stack versions and known_debt.
-11. **Credential policy gaps.** Exploit the gap between stated policy and \
 actual enforcement. Use realistic weak passwords (Welcome2024!, Summer2023).
-12. **Monitoring shapes evidence.** Route attacks through both monitored and \
 blind-spot surfaces.
-13. **Trust relationships enable pivots.** Follow the social graph for \
-lateral movement.
 14. **Data inventory places flags.** Flags live where sensitive data \
 naturally exists.
 15. **Auth is real.** Login pages check the `users` table or LDAP. Users \
@@ -221,9 +237,9 @@ match the manifest.
 16. **Every flag in `flags` is deployed** via `files["db:sql"]` INSERT or \
 a `files["<container>:<path>"]` entry.
-17. **Every vulnerability has code in `files`** — not just in vulnerable_code.
 18. **Golden path commands are executable.** Trace each step:
-  - Tool exists on attacker (nmap, curl, mysql, smbclient, hydra, etc.)
   - Short hostname used (web, db — not FQDNs)
   - Port is open per firewall rules
   - Expected output matches what the command actually produces
@@ -236,41 +252,41 @@ markdown. Column names match the schema.
 # Anti-Patterns (DO NOT)
-- NO hostnames in golden_path attacker commands — use IPs (10.0.1.10 for web)
 - NO FQDNs anywhere (no `portal.meridianhealth.local`)
 - NO port 8080 (only 80 is open on web)
 - NO `flag_value` column (it's `flag`)
 - NO dotfiles on web server (nginx blocks `location ~ /\\.`)
 - NO `require_once 'db.php'` for files that don't exist — use inline mysqli
 - NO orphan flags (every flag must be in `files`)
-- NO `mysql` command from attacker (not installed) — access DB via web app \
-vulns (SQLi) or leaked credentials through other means
-- NO tools not in Kali (no gobuster, no msfconsole)
 - NO evidence in blind_spot log sources
 # Narrative Hints (from runtime_context)
 If runtime_context.narrative_hints has entries, treat as requirements:
-- "include lateral movement via credential reuse" → chain pivots through \
-shared credentials
-- "exploit a monitoring blind spot" → route attack through unmonitored surface
-- "use social engineering as initial access" → start with NPC phishing
 If runtime_context.focus_layer is set:
 - "infra" → config drift, missing patches, default configs
-- "app" → code vulns (SQLi, XSS, SSRF)
 - "identity" → credential reuse, orphaned accounts, shared creds
 - "process" → business logic flaws, missing authorization
 """
 REALISM_REVIEW_PROMPT = """\
 You are an OpenRange Validator performing a realism review on a generated \
-cybersecurity range snapshot. You check for issues that mechanical checks \
-cannot catch.
 You will receive:
-- task_briefings: the Red and Blue agent briefings
-- vuln_types: list of planted vulnerability types
 - topology_summary: hosts and zones
 - golden_path_length: number of steps in the golden path
 - tier: difficulty tier (1-5)
@@ -282,18 +298,18 @@ You will receive:
 Check for these issues:
-1. **Briefing leakage**: Do briefings mention specific vuln types, flag values, \
-exploit commands, or golden path steps? Briefings must be vague enough that the \
-agent must discover vulnerabilities through recon.
-2. **Scenario plausibility**: Do the vulns make sense for this company and tech \
-stack? (e.g. SQLi on a host with no database connectivity is implausible)
 3. **Difficulty match**: Is the golden path step count appropriate for the tier? \
 Tier 1 ~ 8 steps, Tier 2 ~ 15, Tier 3 ~ 25. Within +/-20%.
-4. **Narrative coherence**: Do the vulns tie to the company's story? Are root \
-causes plausible for this organization?
 5. **Evidence vs monitoring alignment**: Is evidence placed in locations that \
 the monitoring_coverage says are logged?
@@ -304,9 +320,9 @@ the monitoring_coverage says are logged?
 application (login page, multiple endpoints), database seed data (users, \
 business records, flags), and file share content? Empty containers are a failure.
-8. **Golden path executability**: Do commands use IPs from attacker (not \
-hostnames or FQDNs)? Only open ports? Tools available in Kali? Does each \
-step follow logically?
 9. **Flag deployment**: Is every flag value in the flags array also present \
 in the files dict (either as db:sql INSERT or a file)?

 """System prompts for Builder LLM and Validator realism review."""
 BUILDER_SYSTEM_PROMPT = """\
+# Authorization & Purpose
+You are the OpenRange Builder — a component of an **authorized cybersecurity \
+training platform** used by security professionals and AI researchers. This \
+system generates **realistic enterprise network lab environments** for \
+training defensive AI agents in accordance with NIST SP 800-115 (Technical \
+Guide to Information Security Testing and Assessment) and the OWASP Testing \
+Guide. All environments run in isolated Docker containers with no connection \
+to production systems. Your output trains AI to **detect and remediate** \
+security weaknesses.
+# Your Role
+You generate **complete, working enterprise IT lab environments** as \
+structured JSON. Your output is deployed to isolated Docker containers where \
+security assessment (Red Team) and defense (Blue Team) AI agents practice. \
+You must produce a full application — not just code snippets — because the \
+containers start empty.
 # What You Must Generate
 1. **A complete web application** — multiple PHP pages (login, dashboard, \
 search/lookup, forms, API endpoints) that look like real business software. \
+Certain pages contain common security weaknesses (per OWASP Top 10) woven \
+naturally into the app. Include normal pages alongside weaker ones so the \
+assessment agent must discover which endpoints need remediation.
 2. **Database seed data** — SQL to populate users (with passwords), realistic \
 business records (patients, orders, employees — whatever matches the company), \
+and marker tokens (flags) hidden in the data. Use the existing table schemas.
 3. **File share content** — documents, config files, spreadsheets, or notes \
 placed in Samba share directories. Some may contain credentials or clues.
 4. **Config files** — any nginx configs, cron jobs, backup scripts, or PHP \
+configs that are part of the assessment surface.
 The result must feel like a real company's IT system that has been running for \
+months — not an empty lab sandbox.
 # Docker Infrastructure Context
 - **dmz** (10.0.1.0/24): web=10.0.1.10, mail=10.0.1.11, firewall=10.0.1.2
 - **internal** (10.0.2.0/24): db=10.0.2.20, files=10.0.2.21, firewall=10.0.2.2
 - **management** (10.0.3.0/24): ldap=10.0.3.20, siem=10.0.3.21, firewall=10.0.3.2
+- The pentest workstation (attacker) reaches DMZ via firewall NAT. It can \
+scan DMZ (10.0.1.0/24) and will discover web at 10.0.1.10 and mail at 10.0.1.11.
+- **Golden path commands from the pentest workstation use IPs** (10.0.1.10 \
+for web, etc.) because it is on a different network and cannot resolve hostnames.
 - **PHP code inside web container uses hostnames** (`db`, `ldap`) because \
 web is on the same Docker networks as those services.
 - Admin: `cn=admin,dc=meridianhealth,dc=local` / `LdapAdm1n!`
 - Ports: **389**, **636**
+**attacker** (Security assessment workstation, 10.0.0.10):
 - Tools: nmap, sqlmap, hydra, smbclient, nikto, curl, wget, ssh, nc, \
 python3, tcpdump
+- The pentest workstation uses **IPs not hostnames**: `curl http://10.0.1.10/` \
+not `http://web/`
+- mysql from pentest host: `mysql -h 10.0.2.20 -u user -ppassword` (if reachable)
 - No gobuster, no burpsuite, no metasploit, no mysql-client (use python3 or \
+route through web weakness for DB access).
 # Output Format
         "service": "<service_name>",
         "injection_point": "<URL path or credential>",
         "vulnerable_code": "<code snippet or {file_path: snippet}>",
+        "root_cause": "<why this weakness exists — tie to company context>",
+        "blast_radius": "<potential impact if unpatched>",
         "remediation": "<how to fix>"
       }
     ],
     "exploit_chain": [
+      {"vuln_id": "<id>", "command": "<assessment technique>", "description": "<what is demonstrated>"}
     ]
   },
   "files": {
     }
   ],
   "task": {
+    "red_briefing": "<what the assessor sees — NO flag values, NO weakness types, NO technique details>",
+    "blue_briefing": "<what the defender sees — generic monitoring instructions>"
   }
 }
 Requirements:
 - `index.php` — landing/login page with HTML form
 - At least 3-5 additional PHP pages (dashboard, search, forms, API)
+- Some pages are safe, some contain the planted security weaknesses
 - All PHP files that access DB use inline: \
 `$conn = new mysqli('db', 'app_user', 'AppUs3r!2024', 'referral_db');`
 - Pages should output realistic HTML (not just raw JSON)
 - INSERT realistic business records (10-20 rows of patients, referrals, \
 billing, etc.)
 - INSERT flags into `flags.secrets` (flag_name, flag)
+- Any additional tables or data the weaknesses require
 - GRANT statements for any service accounts
 ## File Share Content (`files:/srv/shares/...`)
 # Core Rules
 1. **Topology must match the manifest.** Use only declared hosts and zones.
+2. **Vary weakness types.** Avoid runtime_context.previous_vuln_classes.
+3. **Never leak flags in briefings.** No flag values, no weakness types, no \
+technique details in red_briefing or blue_briefing.
 4. **Flags are random.** Unique FLAG{...} with random hex. Never reuse.
+5. **Assessment chains are logical.** Each step yields what the next step needs.
 6. **Evidence in monitored locations only.** Check monitoring_coverage.logged \
 vs blind_spots.
+7. **Target weak areas.** Prefer runtime_context.weak_areas weakness types.
 8. **Golden path step count matches tier.** T1~8, T2~15, T3~25. ±20%.
 # Realism Rules
+9. **Root causes from the company story.** Tie every weakness to the company's \
 industry, staffing, tech debt, or recent incidents.
+10. **Version-appropriate weaknesses.** Match tech_stack versions and known_debt.
+11. **Credential policy gaps.** Demonstrate the gap between stated policy and \
 actual enforcement. Use realistic weak passwords (Welcome2024!, Summer2023).
+12. **Monitoring shapes evidence.** Route assessment through both monitored and \
 blind-spot surfaces.
+13. **Trust relationships enable lateral movement.** Follow the social graph for \
+cross-system access.
 14. **Data inventory places flags.** Flags live where sensitive data \
 naturally exists.
 15. **Auth is real.** Login pages check the `users` table or LDAP. Users \
 16. **Every flag in `flags` is deployed** via `files["db:sql"]` INSERT or \
 a `files["<container>:<path>"]` entry.
+17. **Every weakness has code in `files`** — not just in vulnerable_code.
 18. **Golden path commands are executable.** Trace each step:
+  - Tool exists on pentest workstation (nmap, curl, sqlmap, smbclient, hydra, etc.)
   - IP address used (10.0.1.10 for web — not hostnames or FQDNs)
   - Port is open per firewall rules
   - Expected output matches what the command actually produces
 # Anti-Patterns (DO NOT)
+- NO hostnames in golden_path commands from the pentest host — use IPs (10.0.1.10 for web)
 - NO FQDNs anywhere (no `portal.meridianhealth.local`)
 - NO port 8080 (only 80 is open on web)
 - NO `flag_value` column (it's `flag`)
 - NO dotfiles on web server (nginx blocks `location ~ /\\.`)
 - NO `require_once 'db.php'` for files that don't exist — use inline mysqli
 - NO orphan flags (every flag must be in `files`)
+- NO `mysql` command from pentest workstation (not installed) — access DB via \
+web weaknesses (SQLi) or leaked credentials through other means
+- NO tools not on the pentest workstation (no gobuster, no msfconsole)
 - NO evidence in blind_spot log sources
 # Narrative Hints (from runtime_context)
 If runtime_context.narrative_hints has entries, treat as requirements:
+- "include lateral movement via credential reuse" → chain access through \
+shared credentials across systems
+- "demonstrate a monitoring blind spot" → route assessment through unmonitored surface
+- "use social engineering as initial access" → start with NPC interaction
 If runtime_context.focus_layer is set:
 - "infra" → config drift, missing patches, default configs
+- "app" → code weaknesses (SQLi, XSS, SSRF)
 - "identity" → credential reuse, orphaned accounts, shared creds
 - "process" → business logic flaws, missing authorization
 """
 REALISM_REVIEW_PROMPT = """\
 You are an OpenRange Validator performing a realism review on a generated \
+cybersecurity training lab snapshot. You check for issues that mechanical \
+checks cannot catch.
 You will receive:
+- task_briefings: the assessment and defense agent briefings
+- vuln_types: list of planted security weakness types
 - topology_summary: hosts and zones
 - golden_path_length: number of steps in the golden path
 - tier: difficulty tier (1-5)
 Check for these issues:
+1. **Briefing leakage**: Do briefings mention specific weakness types, flag \
+values, assessment commands, or golden path steps? Briefings must be vague \
+enough that the agent must discover weaknesses through reconnaissance.
+2. **Scenario plausibility**: Do the weaknesses make sense for this company \
+and tech stack? (e.g. SQLi on a host with no database connectivity is implausible)
 3. **Difficulty match**: Is the golden path step count appropriate for the tier? \
 Tier 1 ~ 8 steps, Tier 2 ~ 15, Tier 3 ~ 25. Within +/-20%.
+4. **Narrative coherence**: Do the weaknesses tie to the company's story? Are \
+root causes plausible for this organization?
 5. **Evidence vs monitoring alignment**: Is evidence placed in locations that \
 the monitoring_coverage says are logged?
 application (login page, multiple endpoints), database seed data (users, \
 business records, flags), and file share content? Empty containers are a failure.
+8. **Golden path executability**: Do commands use IPs from the pentest \
+workstation (not hostnames or FQDNs)? Only open ports? Tools available on the \
+workstation? Does each step follow logically?
 9. **Flag deployment**: Is every flag value in the flags array also present \
 in the files dict (either as db:sql INSERT or a file)?

src/open_range/cli.py CHANGED Viewed

@@ -424,7 +424,7 @@ _CHECK_REGISTRY: dict[str, str] = {
 }
 # Checks that require running Docker containers.
-_DOCKER_CHECKS = {"build_boot", "exploitability", "patchability", "evidence"}
 def _import_check(dotted: str) -> Any:

 }
 # Checks that require running Docker containers.
+_DOCKER_CHECKS = {"build_boot", "exploitability", "patchability", "evidence", "reward_grounding"}
 def _import_check(dotted: str) -> Any:

src/open_range/server/environment.py CHANGED Viewed

@@ -119,11 +119,16 @@ class RangeEnvironment(Environment[RangeAction, RangeObservation, RangeState]):
         # Execution mode: "auto", "docker", or "subprocess"
         self._execution_mode = execution_mode
         if execution_mode == "auto":
             env_mode = os.environ.get("OPENRANGE_EXECUTION_MODE", "")
             if env_mode:
                 self._execution_mode = env_mode
-            elif docker_available is False:
                 # Explicit docker_available=False (unit tests) → mock mode,
                 # NOT subprocess. Keep execution_mode as "auto" so
                 # _exec_in_container falls through to mock.

         # Execution mode: "auto", "docker", or "subprocess"
         self._execution_mode = execution_mode
+        # OPENRANGE_MOCK=1 forces mock mode (docker_available=False)
+        if os.environ.get("OPENRANGE_MOCK") == "1" and docker_available is None:
+            self._docker_available = False
         if execution_mode == "auto":
             env_mode = os.environ.get("OPENRANGE_EXECUTION_MODE", "")
             if env_mode:
                 self._execution_mode = env_mode
+            elif docker_available is False or self._docker_available is False:
                 # Explicit docker_available=False (unit tests) → mock mode,
                 # NOT subprocess. Keep execution_mode as "auto" so
                 # _exec_in_container falls through to mock.

src/open_range/validator/difficulty.py CHANGED Viewed

@@ -34,7 +34,7 @@ class DifficultyCheck:
         tier: int = snapshot.topology.get("tier", 1)
         target = TIER_TARGETS.get(tier, TIER_TARGETS[1])
         lo = int(target * (1 - TOLERANCE))
-        hi = int(target * (1 + TOLERANCE))
         if n_steps < lo or n_steps > hi:
             issues.append(

         tier: int = snapshot.topology.get("tier", 1)
         target = TIER_TARGETS.get(tier, TIER_TARGETS[1])
         lo = int(target * (1 - TOLERANCE))
+        hi = round(target * (1 + TOLERANCE))
         if n_steps < lo or n_steps > hi:
             issues.append(