# Skyvern/tests/unit/test_script_reviewer_validators.py
#
# 306 lines
# 13 KiB
# Python

"""Tests for ScriptReviewer validation methods."""
from skyvern.services.script_reviewer import ScriptReviewer
class TestValidateNoHardcodedValues:
"""Tests for _validate_no_hardcoded_values."""
def setup_method(self) -> None:
self.reviewer = ScriptReviewer()
def test_no_params_returns_none(self) -> None:
code = 'await page.click(selector="button")'
assert self.reviewer._validate_no_hardcoded_values(code, None) is None
assert self.reviewer._validate_no_hardcoded_values(code, {}) is None
def test_short_values_ignored(self) -> None:
"""Values shorter than 5 chars should not trigger (too many false positives)."""
code = """
async def block_fn(page, context):
if 'yes' == 'yes':
return {"next_block_label": "send_email", "branch_index": 0}
"""
params = {"flag": "yes", "ok": "true"}
assert self.reviewer._validate_no_hardcoded_values(code, params) is None
def test_detects_hardcoded_email(self) -> None:
"""Should catch a hardcoded email that should be context.parameters['recipient']."""
code = """
async def block_fn(page, context):
recipient = 'billing@acme-test.example.com'
if recipient != "":
return {"next_block_label": "send_email", "branch_index": 0}
"""
params = {"recipient": "billing@acme-test.example.com"}
error = self.reviewer._validate_no_hardcoded_values(code, params)
assert error is not None
assert "hardcoded" in error.lower()
assert "recipient" in error
assert "context.parameters" in error
def test_detects_hardcoded_url(self) -> None:
"""Should catch a hardcoded URL that should be context.parameters['website_url']."""
code = """
async def login(page, context):
await page.goto('https://portal.vendor.com/login')
await page.fill(selector='input[name="email"]', value=context.parameters['email'])
"""
params = {"website_url": "https://portal.vendor.com/login", "email": "user@example.com"}
error = self.reviewer._validate_no_hardcoded_values(code, params)
assert error is not None
assert "website_url" in error
def test_allows_context_parameters_reference(self) -> None:
"""Using context.parameters['key'] should NOT trigger the validator."""
code = """
async def block_fn(page, context):
recipient = context.parameters.get('recipient', '')
if recipient != "":
return {"next_block_label": "send_email", "branch_index": 0}
"""
params = {"recipient": "billing@acme-test.example.com"}
assert self.reviewer._validate_no_hardcoded_values(code, params) is None
def test_allows_non_parameter_literals(self) -> None:
"""String literals that aren't parameter values should be fine."""
code = """
async def block_fn(page, context):
await page.click(selector='button:has-text("Sign in")', ai='fallback', prompt='Click sign in')
"""
params = {"email": "user@example.com", "password": "secret123"}
assert self.reviewer._validate_no_hardcoded_values(code, params) is None
def test_ignores_comments(self) -> None:
"""Values in comments should not trigger."""
code = """
async def block_fn(page, context):
# billing@acme-test.example.com is the test email
recipient = context.parameters.get('recipient', '')
if recipient != "":
return {"next_block_label": "send_email", "branch_index": 0}
"""
params = {"recipient": "billing@acme-test.example.com"}
assert self.reviewer._validate_no_hardcoded_values(code, params) is None
def test_detects_multiple_hardcoded_values(self) -> None:
"""Should report multiple hardcoded values."""
code = """
async def block_fn(page, context):
await page.goto('https://portal.vendor.com/login')
await page.fill(selector='input', value='billing@acme-test.example.com')
"""
params = {
"website_url": "https://portal.vendor.com/login",
"recipient": "billing@acme-test.example.com",
}
error = self.reviewer._validate_no_hardcoded_values(code, params)
assert error is not None
assert "2 hardcoded" in error
def test_allows_block_labels_and_keywords(self) -> None:
"""Common structural strings like block labels should not trigger."""
code = """
async def block_fn(page, context):
return {"next_block_label": "send_email", "branch_index": 0}
"""
# Even if "send_email" is technically a value somewhere, it's a block label
params = {"account_number": "12345678"}
assert self.reviewer._validate_no_hardcoded_values(code, params) is None
class TestValidateParameterPreservation:
"""Tests for _validate_parameter_preservation."""
def setup_method(self) -> None:
self.reviewer = ScriptReviewer()
def test_no_existing_code_returns_none(self) -> None:
new_code = "await page.fill(selector='#email', ai='proactive', prompt='email')"
assert self.reviewer._validate_parameter_preservation(new_code, None, ["email"]) is None
def test_no_parameter_keys_returns_none(self) -> None:
old_code = "await page.fill(selector='#email', value=context.parameters['email'])"
new_code = "await page.fill(selector='#email', ai='proactive', prompt='email')"
assert self.reviewer._validate_parameter_preservation(new_code, old_code, []) is None
def test_preserved_refs_returns_none(self) -> None:
"""When all parameter refs are preserved, validation passes."""
old_code = """
await page.fill(selector='#email', value=context.parameters['email'])
await page.fill(selector='#pass', value=context.parameters['password'])
"""
new_code = """
choice = await page.classify(...)
if choice == 0:
await page.fill(selector='#email', value=context.parameters['email'])
await page.fill(selector='#pass', value=context.parameters['password'])
"""
assert self.reviewer._validate_parameter_preservation(new_code, old_code, ["email", "password"]) is None
def test_detects_dropped_refs(self) -> None:
"""When the LLM drops value= refs, validation catches it."""
old_code = """
await page.fill(selector='#email', value=context.parameters['email'])
await page.fill(selector='#pass', value=context.parameters['password'])
"""
new_code = """
choice = await page.classify(...)
if choice == 0:
await page.fill(selector='#email', ai='proactive', prompt='fill email')
await page.fill(selector='#pass', ai='proactive', prompt='fill password')
"""
error = self.reviewer._validate_parameter_preservation(new_code, old_code, ["email", "password"])
assert error is not None
assert "email" in error
assert "password" in error
assert "dropped" in error.lower()
def test_ignores_refs_not_in_parameter_keys(self) -> None:
"""Spurious refs in old code that aren't valid keys should be ignored."""
old_code = "await page.fill(selector='#x', value=context.parameters['invented_key'])"
new_code = "await page.fill(selector='#x', ai='proactive', prompt='fill x')"
assert self.reviewer._validate_parameter_preservation(new_code, old_code, ["email", "password"]) is None
def test_partial_drop_detected(self) -> None:
"""Dropping one ref while keeping another should flag only the dropped one."""
old_code = """
await page.fill(selector='#email', value=context.parameters['email'])
await page.fill(selector='#pass', value=context.parameters['password'])
"""
new_code = """
await page.fill(selector='#email', value=context.parameters['email'])
await page.fill(selector='#pass', ai='proactive', prompt='fill password')
"""
error = self.reviewer._validate_parameter_preservation(new_code, old_code, ["email", "password"])
assert error is not None
assert "context.parameters['password']" in error
assert "context.parameters['email']" not in error
def test_commented_ref_in_new_code_counts_as_dropped(self) -> None:
"""A parameter ref only in a comment in new code should be flagged as dropped."""
old_code = "await page.fill(selector='#email', value=context.parameters['email'])"
new_code = """
# was: context.parameters['email']
await page.fill(selector='#email', ai='proactive', prompt='fill email')
"""
error = self.reviewer._validate_parameter_preservation(new_code, old_code, ["email"])
assert error is not None
assert "email" in error
class TestValidateBranchReturns:
"""Tests for _validate_branch_returns."""
BRANCHES_TWO = [
{"original_expression": "x > 0", "next_block_label": "block_3", "is_default": False},
{"original_expression": None, "next_block_label": "block_4", "is_default": True},
]
def test_valid_returns_passes(self) -> None:
code = """
async def block_fn(page, context):
if context.parameters.get('x', 0) > 0:
return {"next_block_label": "block_3", "branch_index": 0}
else:
return {"next_block_label": "block_4", "branch_index": 1}
"""
assert ScriptReviewer._validate_branch_returns(code, self.BRANCHES_TWO) is None
def test_invalid_label_detected(self) -> None:
"""Labels not in the branch definitions should be flagged."""
code = """
async def block_fn(page, context):
if context.parameters.get('x', 0) > 0:
return {"next_block_label": "block_99", "branch_index": 0}
else:
return {"next_block_label": "block_4", "branch_index": 1}
"""
error = ScriptReviewer._validate_branch_returns(code, self.BRANCHES_TWO)
assert error is not None
assert "block_99" in error
def test_invalid_index_detected(self) -> None:
"""branch_index values outside 0..N-1 should be flagged."""
code = """
async def block_fn(page, context):
if context.parameters.get('x', 0) > 0:
return {"next_block_label": "block_3", "branch_index": 0}
else:
return {"next_block_label": "block_4", "branch_index": -1}
"""
error = ScriptReviewer._validate_branch_returns(code, self.BRANCHES_TWO)
assert error is not None
assert "-1" in error
def test_none_label_invalid_when_not_in_branches(self) -> None:
"""None next_block_label should be flagged when no branch has a null target."""
code = """
async def block_fn(page, context):
if context.parameters.get('x', 0) > 0:
return {"next_block_label": "block_3", "branch_index": 0}
else:
return {"next_block_label": None, "branch_index": 1}
"""
error = ScriptReviewer._validate_branch_returns(code, self.BRANCHES_TWO)
assert error is not None
assert "next_block_label" in error
def test_none_label_valid_when_in_branches(self) -> None:
"""None next_block_label should pass when a branch has a null target."""
branches = [
{"original_expression": "x > 0", "next_block_label": "block_3", "is_default": False},
{"original_expression": None, "next_block_label": None, "is_default": True},
]
code = """
async def block_fn(page, context):
if context.parameters.get('x', 0) > 0:
return {"next_block_label": "block_3", "branch_index": 0}
else:
return {"next_block_label": None, "branch_index": 1}
"""
assert ScriptReviewer._validate_branch_returns(code, branches) is None
def test_no_literals_passes(self) -> None:
"""Code using variables (not literals) should pass — can't validate statically."""
code = """
async def block_fn(page, context):
label = compute_label()
idx = compute_index()
return {"next_block_label": label, "branch_index": idx}
"""
assert ScriptReviewer._validate_branch_returns(code, self.BRANCHES_TWO) is None
def test_comments_ignored(self) -> None:
"""Values in comments should not trigger validation."""
code = """
async def block_fn(page, context):
# return {"next_block_label": "block_99", "branch_index": -1}
if context.parameters.get('x', 0) > 0:
return {"next_block_label": "block_3", "branch_index": 0}
else:
return {"next_block_label": "block_4", "branch_index": 1}
"""
assert ScriptReviewer._validate_branch_returns(code, self.BRANCHES_TWO) is None
def test_empty_branches_passes(self) -> None:
assert ScriptReviewer._validate_branch_returns("return {}", []) is None
def test_single_quotes_handled(self) -> None:
"""Single-quoted keys should be parsed correctly."""
code = """
async def block_fn(page, context):
return {'next_block_label': 'block_3', 'branch_index': 0}
"""
assert ScriptReviewer._validate_branch_returns(code, self.BRANCHES_TWO) is None
def test_both_label_and_index_invalid(self) -> None:
"""Both invalid label and index should be reported."""
code = """
async def block_fn(page, context):
return {"next_block_label": "wrong_label", "branch_index": -1}
"""
error = ScriptReviewer._validate_branch_returns(code, self.BRANCHES_TWO)
assert error is not None
assert "wrong_label" in error
assert "-1" in error