complete_on_downloads for task block (#403)

This commit is contained in:
Kerem Yilmaz 2024-06-02 23:24:30 -07:00 committed by GitHub
parent 343937e12c
commit f1d5a3a687
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
9 changed files with 118 additions and 30 deletions

View file

@ -23,6 +23,7 @@ from skyvern.exceptions import (
from skyvern.forge import app from skyvern.forge import app
from skyvern.forge.async_operations import AgentPhase, AsyncOperationPool from skyvern.forge.async_operations import AgentPhase, AsyncOperationPool
from skyvern.forge.prompts import prompt_engine from skyvern.forge.prompts import prompt_engine
from skyvern.forge.sdk.api.files import get_number_of_files_in_directory, get_path_for_workflow_download_directory
from skyvern.forge.sdk.artifact.models import ArtifactType from skyvern.forge.sdk.artifact.models import ArtifactType
from skyvern.forge.sdk.core import skyvern_context from skyvern.forge.sdk.core import skyvern_context
from skyvern.forge.sdk.core.security import generate_skyvern_signature from skyvern.forge.sdk.core.security import generate_skyvern_signature
@ -195,10 +196,18 @@ class ForgeAgent:
api_key: str | None = None, api_key: str | None = None,
workflow_run: WorkflowRun | None = None, workflow_run: WorkflowRun | None = None,
close_browser_on_completion: bool = True, close_browser_on_completion: bool = True,
# If complete_on_download is True and there is a workflow run, the task will be marked as completed
# if a download happens during the step execution.
complete_on_download: bool = False,
) -> Tuple[Step, DetailedAgentStepOutput | None, Step | None]: ) -> Tuple[Step, DetailedAgentStepOutput | None, Step | None]:
next_step: Step | None = None next_step: Step | None = None
detailed_output: DetailedAgentStepOutput | None = None detailed_output: DetailedAgentStepOutput | None = None
num_files_before = 0
try: try:
if task.workflow_run_id:
num_files_before = get_number_of_files_in_directory(
get_path_for_workflow_download_directory(task.workflow_run_id)
)
# Check some conditions before executing the step, throw an exception if the step can't be executed # Check some conditions before executing the step, throw an exception if the step can't be executed
await app.AGENT_FUNCTION.validate_step_execution(task, step) await app.AGENT_FUNCTION.validate_step_execution(task, step)
( (
@ -214,6 +223,30 @@ class ForgeAgent:
task = await self.update_task_errors_from_detailed_output(task, detailed_output) task = await self.update_task_errors_from_detailed_output(task, detailed_output)
retry = False retry = False
if complete_on_download and task.workflow_run_id:
num_files_after = get_number_of_files_in_directory(
get_path_for_workflow_download_directory(task.workflow_run_id)
)
if num_files_after > num_files_before:
LOG.info(
"Task marked as completed due to download",
task_id=task.task_id,
num_files_before=num_files_before,
num_files_after=num_files_after,
)
last_step = await self.update_step(step, is_last=True)
completed_task = await self.update_task(
task,
status=TaskStatus.completed,
)
await self.send_task_response(
task=completed_task,
last_step=last_step,
api_key=api_key,
close_browser_on_completion=close_browser_on_completion,
)
return last_step, detailed_output, None
# If the step failed, mark the step as failed and retry # If the step failed, mark the step as failed and retry
if step.status == StepStatus.failed: if step.status == StepStatus.failed:
maybe_next_step = await self.handle_failed_step(organization, task, step) maybe_next_step = await self.handle_failed_step(organization, task, step)
@ -273,6 +306,7 @@ class ForgeAgent:
next_step, next_step,
api_key=api_key, api_key=api_key,
close_browser_on_completion=close_browser_on_completion, close_browser_on_completion=close_browser_on_completion,
complete_on_download=complete_on_download,
) )
elif SettingsManager.get_settings().execute_all_steps() and next_step: elif SettingsManager.get_settings().execute_all_steps() and next_step:
return await self.execute_step( return await self.execute_step(
@ -281,6 +315,7 @@ class ForgeAgent:
next_step, next_step,
api_key=api_key, api_key=api_key,
close_browser_on_completion=close_browser_on_completion, close_browser_on_completion=close_browser_on_completion,
complete_on_download=complete_on_download,
) )
else: else:
LOG.info( LOG.info(

View file

@ -68,3 +68,13 @@ def zip_files(files_path: str, zip_file_path: str) -> str:
def get_path_for_workflow_download_directory(workflow_run_id: str) -> Path: def get_path_for_workflow_download_directory(workflow_run_id: str) -> Path:
return Path(f"{REPO_ROOT_DIR}/downloads/{workflow_run_id}/") return Path(f"{REPO_ROOT_DIR}/downloads/{workflow_run_id}/")
def get_number_of_files_in_directory(directory: Path, recursive: bool = False) -> int:
count = 0
for root, dirs, files in os.walk(directory):
if not recursive:
count += len(files)
break
count += len(files)
return count

View file

@ -217,7 +217,7 @@ class WorkflowRunContext:
self, parameter: OutputParameter, value: dict[str, Any] | list | str | None self, parameter: OutputParameter, value: dict[str, Any] | list | str | None
) -> None: ) -> None:
if parameter.key in self.values: if parameter.key in self.values:
LOG.error(f"Output parameter {parameter.output_parameter_id} already has a registered value") LOG.warning(f"Output parameter {parameter.output_parameter_id} already has a registered value")
return return
self.values[parameter.key] = value self.values[parameter.key] = value

View file

@ -71,6 +71,14 @@ class Block(BaseModel, abc.ABC):
workflow_run_id: str, workflow_run_id: str,
value: dict[str, Any] | list | str | None = None, value: dict[str, Any] | list | str | None = None,
) -> None: ) -> None:
if workflow_run_context.has_value(self.output_parameter.key):
LOG.warning(
"Output parameter value already recorded",
output_parameter_id=self.output_parameter.output_parameter_id,
workflow_run_id=workflow_run_id,
)
return
await workflow_run_context.register_output_parameter_value_post_execution( await workflow_run_context.register_output_parameter_value_post_execution(
parameter=self.output_parameter, parameter=self.output_parameter,
value=value, value=value,
@ -150,6 +158,7 @@ class TaskBlock(Block):
max_retries: int = 0 max_retries: int = 0
max_steps_per_run: int | None = None max_steps_per_run: int | None = None
parameters: list[PARAMETER_TYPE] = [] parameters: list[PARAMETER_TYPE] = []
complete_on_download: bool = False
def get_all_parameters( def get_all_parameters(
self, self,
@ -265,6 +274,7 @@ class TaskBlock(Block):
task=task, task=task,
step=step, step=step,
workflow_run=workflow_run, workflow_run=workflow_run,
complete_on_download=self.complete_on_download,
) )
except Exception as e: except Exception as e:
# Make sure the task is marked as failed in the database before raising the exception # Make sure the task is marked as failed in the database before raising the exception

View file

@ -87,6 +87,7 @@ class TaskBlockYAML(BlockYAML):
max_retries: int = 0 max_retries: int = 0
max_steps_per_run: int | None = None max_steps_per_run: int | None = None
parameter_keys: list[str] | None = None parameter_keys: list[str] | None = None
complete_on_download: bool = False
class ForLoopBlockYAML(BlockYAML): class ForLoopBlockYAML(BlockYAML):

View file

@ -969,6 +969,7 @@ class WorkflowService:
error_code_mapping=block_yaml.error_code_mapping, error_code_mapping=block_yaml.error_code_mapping,
max_steps_per_run=block_yaml.max_steps_per_run, max_steps_per_run=block_yaml.max_steps_per_run,
max_retries=block_yaml.max_retries, max_retries=block_yaml.max_retries,
complete_on_download=block_yaml.complete_on_download,
) )
elif block_yaml.block_type == BlockType.FOR_LOOP: elif block_yaml.block_type == BlockType.FOR_LOOP:
loop_blocks = [ loop_blocks = [

View file

@ -13,7 +13,11 @@ from skyvern.constants import REPO_ROOT_DIR
from skyvern.exceptions import ImaginaryFileUrl, MissingElement, MissingFileUrl, MultipleElementsFound from skyvern.exceptions import ImaginaryFileUrl, MissingElement, MissingFileUrl, MultipleElementsFound
from skyvern.forge import app from skyvern.forge import app
from skyvern.forge.prompts import prompt_engine from skyvern.forge.prompts import prompt_engine
from skyvern.forge.sdk.api.files import download_file from skyvern.forge.sdk.api.files import (
download_file,
get_number_of_files_in_directory,
get_path_for_workflow_download_directory,
)
from skyvern.forge.sdk.models import Step from skyvern.forge.sdk.models import Step
from skyvern.forge.sdk.schemas.tasks import Task from skyvern.forge.sdk.schemas.tasks import Task
from skyvern.forge.sdk.services.bitwarden import BitwardenConstants from skyvern.forge.sdk.services.bitwarden import BitwardenConstants
@ -162,17 +166,42 @@ async def handle_click_action(
task: Task, task: Task,
step: Step, step: Step,
) -> list[ActionResult]: ) -> list[ActionResult]:
num_downloaded_files_before = 0
download_dir = None
if task.workflow_run_id:
download_dir = get_path_for_workflow_download_directory(task.workflow_run_id)
num_downloaded_files_before = get_number_of_files_in_directory(download_dir)
LOG.info(
"Number of files in download directory before click",
num_downloaded_files_before=num_downloaded_files_before,
download_dir=download_dir,
)
xpath = await validate_actions_in_dom(action, page, scraped_page) xpath = await validate_actions_in_dom(action, page, scraped_page)
await asyncio.sleep(0.3) await asyncio.sleep(0.3)
if action.download: if action.download:
return await handle_click_to_download_file_action(action, page, scraped_page) results = await handle_click_to_download_file_action(action, page, scraped_page)
return await chain_click( else:
task, results = await chain_click(
page, task,
action, page,
xpath, action,
timeout=SettingsManager.get_settings().BROWSER_ACTION_TIMEOUT_MS, xpath,
) timeout=SettingsManager.get_settings().BROWSER_ACTION_TIMEOUT_MS,
)
if results and task.workflow_run_id and download_dir:
LOG.info("Sleeping for 5 seconds to let the download finish")
await asyncio.sleep(5)
num_downloaded_files_after = get_number_of_files_in_directory(download_dir)
LOG.info(
"Number of files in download directory after click",
num_downloaded_files_after=num_downloaded_files_after,
download_dir=download_dir,
)
if num_downloaded_files_after > num_downloaded_files_before:
results[-1].download_triggered = True
return results
async def handle_click_to_download_file_action( async def handle_click_to_download_file_action(
@ -677,16 +706,6 @@ async def chain_click(
page.on("filechooser", fc_func) page.on("filechooser", fc_func)
LOG.info("Registered file chooser listener", action=action, path=file) LOG.info("Registered file chooser listener", action=action, path=file)
# If a download is triggered due to the click, we need to let LLM know in action_results
download_triggered = False
def download_func(download: Any) -> None:
nonlocal download_triggered
download_triggered = True
page.on("download", download_func)
LOG.info("Registered download listener", action=action)
""" """
Clicks on an element identified by the xpath and its parent if failed. Clicks on an element identified by the xpath and its parent if failed.
:param xpath: xpath of the element to click :param xpath: xpath of the element to click
@ -698,7 +717,6 @@ async def chain_click(
return [ return [
ActionSuccess( ActionSuccess(
javascript_triggered=javascript_triggered, javascript_triggered=javascript_triggered,
download_triggered=download_triggered,
) )
] ]
except Exception as e: except Exception as e:
@ -706,7 +724,6 @@ async def chain_click(
ActionFailure( ActionFailure(
e, e,
javascript_triggered=javascript_triggered, javascript_triggered=javascript_triggered,
download_triggered=download_triggered,
) )
] ]
if await is_input_element(page.locator(xpath)): if await is_input_element(page.locator(xpath)):
@ -716,7 +733,6 @@ async def chain_click(
xpath=xpath, xpath=xpath,
) )
sibling_action_result = await click_sibling_of_input(page.locator(xpath), timeout=timeout) sibling_action_result = await click_sibling_of_input(page.locator(xpath), timeout=timeout)
sibling_action_result.download_triggered = download_triggered
action_results.append(sibling_action_result) action_results.append(sibling_action_result)
if type(sibling_action_result) == ActionSuccess: if type(sibling_action_result) == ActionSuccess:
return action_results return action_results
@ -736,7 +752,6 @@ async def chain_click(
ActionSuccess( ActionSuccess(
javascript_triggered=javascript_triggered, javascript_triggered=javascript_triggered,
interacted_with_parent=True, interacted_with_parent=True,
download_triggered=download_triggered,
) )
) )
except Exception as pe: except Exception as pe:
@ -765,7 +780,6 @@ async def chain_click(
if file: if file:
await asyncio.sleep(10) await asyncio.sleep(10)
page.remove_listener("filechooser", fc_func) page.remove_listener("filechooser", fc_func)
page.remove_listener("download", download_func)
def get_anchor_to_click(scraped_page: ScrapedPage, element_id: int) -> str | None: def get_anchor_to_click(scraped_page: ScrapedPage, element_id: int) -> str | None:

View file

@ -19,10 +19,26 @@ class ActionResult(BaseModel):
interacted_with_parent: bool | None = None interacted_with_parent: bool | None = None
def __str__(self) -> str: def __str__(self) -> str:
return ( results = ["ActionResult(success={self.success}"]
f"ActionResult(success={self.success}, exception_type={self.exception_type}, " if self.exception_type or self.exception_message:
f"exception_message={self.exception_message}), data={self.data}" results.append(f"exception_type={self.exception_type}")
) results.append(f"exception_message={self.exception_message}")
if self.data:
results.append(f"data={self.data}")
if self.step_order:
results.append(f"step_order={self.step_order}")
if self.step_retry_number:
results.append(f"step_retry_number={self.step_retry_number}")
if self.javascript_triggered:
results.append(f"javascript_triggered={self.javascript_triggered}")
if self.download_triggered is not None:
results.append(f"download_triggered={self.download_triggered}")
if self.interacted_with_sibling is not None:
results.append(f"interacted_with_sibling={self.interacted_with_sibling}")
if self.interacted_with_parent is not None:
results.append(f"interacted_with_parent={self.interacted_with_parent}")
return ", ".join(results) + ")"
def __repr__(self) -> str: def __repr__(self) -> str:
return self.__str__() return self.__str__()

View file

@ -183,7 +183,7 @@ class BrowserState:
await self._close_all_other_pages() await self._close_all_other_pages()
LOG.info("A new page is created") LOG.info("A new page is created")
if url: if url:
LOG.info(f"Navigating page to {url} and waiting for 3 seconds") LOG.info(f"Navigating page to {url} and waiting for 5 seconds")
try: try:
start_time = time.time() start_time = time.time()
await self.page.goto(url, timeout=settings.BROWSER_LOADING_TIMEOUT_MS) await self.page.goto(url, timeout=settings.BROWSER_LOADING_TIMEOUT_MS)
@ -193,6 +193,7 @@ class BrowserState:
loading_time=end_time - start_time, loading_time=end_time - start_time,
url=url, url=url,
) )
await asyncio.sleep(5)
except Error as playright_error: except Error as playright_error:
LOG.exception(f"Error while navigating to url: {str(playright_error)}") LOG.exception(f"Error while navigating to url: {str(playright_error)}")
raise FailedToNavigateToUrl(url=url, error_message=str(playright_error)) raise FailedToNavigateToUrl(url=url, error_message=str(playright_error))