LucidtechAI · augustak · Jun 27, 2024 · Jun 27, 2024 · Jun 27, 2024
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -1,5 +1,9 @@
 # Changelog
 
+## Version 13.3.0 - 2024-06-27
+
+- Added `workflows execute-all`, which starts one workflow execution for each document in a dataset
+
 ## Version 13.2.2 - 2024-06-13
 
 - Bugfix `models update-training` now works as intended when specifying `--deployment-environment-id`

diff --git a/lascli/__version__.py b/lascli/__version__.py
@@ -7,4 +7,4 @@
 __maintainer_email__ = 'magnus@lucidtech.ai'
 __title__ = 'lucidtech-las-cli'
 __url__ = 'https://github.com/LucidtechAI/las-cli'
-__version__ = '13.2.2'
+__version__ = '13.3.0'
diff --git a/lascli/parser/workflows.py b/lascli/parser/workflows.py
@@ -3,6 +3,7 @@
 import pathlib
 import textwrap
 from argparse import RawTextHelpFormatter
+from functools import partial
 
 import dateparser
 from las import Client
@@ -32,6 +33,27 @@ def execute_workflow(las_client: Client, workflow_id, path):
     return las_client.execute_workflow(workflow_id, content)
 
 
+def execute_all_workflow(las_client: Client, workflow_id, dataset_id):
+    """Start one execution of workflow_id for every document in dataset_id and return a summary string."""
+    list_fn = partial(las_client.list_documents, dataset_id=dataset_id)
+    list_response = list_fn()
+    documents = list_response['documents']
+    while next_token := list_response.get('nextToken'):  # a missing or null token ends the paging
+        list_response = list_fn(next_token=next_token)
+        documents.extend(list_response['documents'])
+
+    for i, document in enumerate(documents):
+        # NOTE(review): the sleep grows by 4 per document, presumably to stagger the executions - confirm
+        content = {'documentId': document['documentId'], 'source': 'CLI', 'initialSleepInSeconds': i * 4}
+        # metadata may be absent or null, so fall back to an empty dict before reading from it
+        if original_file_path := (document.get('metadata') or {}).get('originalFilePath'):
+            content['title'] = pathlib.Path(original_file_path).name
+        execution = las_client.execute_workflow(workflow_id, content)
+        print(json.dumps(execution, indent=2))  # echo each started execution as it is created
+
+    return f'Started {len(documents)} executions'
+
+
 def list_workflow_executions(las_client: Client, workflow_id, **optional_args):
     return las_client.list_workflow_executions(workflow_id, **optional_args)
 
@@ -196,6 +218,11 @@ def create_workflows_parser(subparsers):
     execute_workflow_parser.add_argument('path', help='path to json-file with input to the first state of the workflow')
     execute_workflow_parser.set_defaults(cmd=execute_workflow)
 
+    execute_workflow_parser = subparsers.add_parser('execute-all')
+    execute_workflow_parser.add_argument('workflow_id')
+    execute_workflow_parser.add_argument('dataset_id', help='Start execution on all documents in dataset')
+    execute_workflow_parser.set_defaults(cmd=execute_all_workflow)
+
     list_executions_parser = subparsers.add_parser('list-executions')
     list_executions_parser.add_argument('workflow_id')
     list_executions_parser.add_argument('--status', '-s', nargs='+', help='Only return those with the given status')