From a1b2dd4b08752547b22dd3f0a85723f9e59e349c Mon Sep 17 00:00:00 2001 From: Roy Wiggins Date: Fri, 31 May 2024 15:58:36 +0000 Subject: [PATCH 01/42] initial work on dicom query/pull interface --- common/types.py | 12 +- webgui.py | 19 +- webinterface/common.py | 11 +- webinterface/dashboards.py | 59 ----- webinterface/dashboards/__init__.py | 7 + webinterface/dashboards/common.py | 7 + webinterface/dashboards/query.py | 77 ++++++ webinterface/dashboards/simple.py | 32 +++ webinterface/modules.py | 6 +- webinterface/query.py | 236 ++++++++++++++++++ webinterface/queue.py | 2 - webinterface/rules.py | 4 - webinterface/targets.py | 2 - .../templates/dashboards/dashboards.html | 1 + webinterface/templates/dashboards/query.html | 117 +++++++++ webinterface/users.py | 5 +- 16 files changed, 508 insertions(+), 89 deletions(-) delete mode 100644 webinterface/dashboards.py create mode 100644 webinterface/dashboards/__init__.py create mode 100644 webinterface/dashboards/common.py create mode 100644 webinterface/dashboards/query.py create mode 100644 webinterface/dashboards/simple.py create mode 100644 webinterface/query.py create mode 100644 webinterface/templates/dashboards/query.html diff --git a/common/types.py b/common/types.py index 33e89511..9558db6c 100755 --- a/common/types.py +++ b/common/types.py @@ -178,6 +178,16 @@ class DicomReceiverConfig(BaseModel): additional_tags: Dict[str,str] = {} +class DicomNode(BaseModel): + name: str + ip: str + port: int + aet_target: str + aet_source: Optional[str] = "" + +class DicomRetrieveConfig(BaseModel): + dicom_nodes: List[DicomNode] = [] + class Config(BaseModel, Compat): appliance_name: str port: int @@ -220,7 +230,7 @@ class Config(BaseModel, Compat): email_notification_from: str = "mercure@mercure.mercure" support_root_modules: Optional[bool] = False webhook_certificate_location: Optional[str] = None - + dicom_retrieve: DicomRetrieveConfig = DicomRetrieveConfig() class TaskInfo(BaseModel, Compat): action: Literal["route", "both", "process", "discard", "notification"] diff --git a/webgui.py b/webgui.py index 911df1de..41ff981e 100755 --- a/webgui.py +++ b/webgui.py @@ -295,7 +295,7 @@ async def show_log(request) -> Response: template = "logs.html" context = { "request": request, - "mercure_version": mercure_defs.VERSION, + "page": "logs", "service_logs": service_logs, "log_id": requested_service, @@ -307,7 +307,6 @@ async def show_log(request) -> Response: "end_time_available": runtime == "systemd", "start_time_available": runtime in ("docker", "systemd"), } - context.update(get_user_information(request)) return templates.TemplateResponse(template, context) @@ -330,14 +329,13 @@ async def configuration(request) -> Response: runtime = helper.get_runner() context = { "request": request, - "mercure_version": mercure_defs.VERSION, + "page": "configuration", "config": config.mercure, "os_string": os_string, "config_edited": config_edited, "runtime": runtime, } - context.update(get_user_information(request)) return templates.TemplateResponse(template, context) @@ -363,11 +361,10 @@ async def configuration_edit(request) -> Response: template = "configuration_edit.html" context = { "request": request, - "mercure_version": mercure_defs.VERSION, + "page": "configuration", "config_content": config_content, } - context.update(get_user_information(request)) return templates.TemplateResponse(template, context) @@ -411,7 +408,7 @@ async def login(request) -> Response: template = "login.html" context = { "request": request, - "mercure_version": 
mercure_defs.VERSION, + "appliance_name": config.mercure.get("appliance_name", "master"), } return templates.TemplateResponse(template, context) @@ -599,7 +596,7 @@ async def login_post(request) -> Response: context = { "request": request, "invalid_password": 1, - "mercure_version": mercure_defs.VERSION, + "appliance_name": config.mercure.get("appliance_name", "mercure Router"), } return templates.TemplateResponse(template, context) @@ -627,14 +624,13 @@ async def settings_edit(request) -> Response: template = "users_edit.html" context = { "request": request, - "mercure_version": mercure_defs.VERSION, + "page": "settings", "edituser": own_name, "edituser_info": users.users_list[own_name], "own_settings": "True", "change_password": users.users_list[own_name].get("change_password", "False"), } - context.update(get_user_information(request)) return templates.TemplateResponse(template, context) @@ -710,7 +706,7 @@ async def homepage(request) -> Response: template = "index.html" context = { "request": request, - "mercure_version": mercure_defs.VERSION, + "page": "homepage", "used_space": used_space, "free_space": free_space, @@ -718,7 +714,6 @@ async def homepage(request) -> Response: "service_status": service_status, "runtime": runtime, } - context.update(get_user_information(request)) return templates.TemplateResponse(template, context) diff --git a/webinterface/common.py b/webinterface/common.py index a870dd35..60e65adb 100755 --- a/webinterface/common.py +++ b/webinterface/common.py @@ -7,14 +7,18 @@ # Standard python includes from typing import Optional, Tuple import asyncio +from redis import Redis +from rq import Queue, Connection # Starlette-related includes from starlette.templating import Jinja2Templates +from common.constants import mercure_defs -templates = Jinja2Templates(directory="webinterface/templates") +worker_queue = Queue(connection=Redis()) + def get_user_information(request) -> dict: """Returns dictionary of values that should always be passed to the templates when the user is logged in.""" return { @@ -23,6 +27,11 @@ def get_user_information(request) -> dict: "is_admin": request.user.is_admin if request.user.is_authenticated else False, } +def get_mercure_version(request) -> dict: + return { "mercure_version": mercure_defs.VERSION } + +templates = Jinja2Templates(directory="webinterface/templates", context_processors=[get_user_information, get_mercure_version]) + async def async_run(cmd, **params) -> Tuple[Optional[int], bytes, bytes]: """Executes the given command in a way compatible with ayncio.""" diff --git a/webinterface/dashboards.py b/webinterface/dashboards.py deleted file mode 100644 index d441f192..00000000 --- a/webinterface/dashboards.py +++ /dev/null @@ -1,59 +0,0 @@ -""" -test.py -======== -Test page for querying the bookkeeper database from the webgui. 
-""" - -# Standard python includes -import daiquiri - -# Starlette-related includes -from starlette.applications import Starlette -from starlette.authentication import requires - -# App-specific includes -from common.constants import mercure_defs -from webinterface.common import get_user_information -from webinterface.common import templates -import common.config as config -from starlette.responses import RedirectResponse -from decoRouter import Router as decoRouter -router = decoRouter() - -logger = config.get_logger() - -################################################################################### -## Test endpoints -################################################################################### - -@router.get("/") -async def index(request): - return RedirectResponse(url="tests") - - -@router.get("/tasks") -@requires("authenticated", redirect="login") -async def tasks(request): - template = "dashboards/tasks.html" - context = { - "request": request, - "mercure_version": mercure_defs.VERSION, - "page": "tasks", - } - context.update(get_user_information(request)) - return templates.TemplateResponse(template, context) - - -@router.get("/tests") -@requires(["authenticated", "admin"], redirect="login") -async def tests(request): - template = "dashboards/tests.html" - context = { - "request": request, - "mercure_version": mercure_defs.VERSION, - "page": "tests", - } - context.update(get_user_information(request)) - return templates.TemplateResponse(template, context) - -dashboards_app = Starlette(routes=router) \ No newline at end of file diff --git a/webinterface/dashboards/__init__.py b/webinterface/dashboards/__init__.py new file mode 100644 index 00000000..7fb55b79 --- /dev/null +++ b/webinterface/dashboards/__init__.py @@ -0,0 +1,7 @@ +from .common import router +from . 
import query, simple +from starlette.applications import Starlette + + + +dashboards_app = Starlette(routes=router) \ No newline at end of file diff --git a/webinterface/dashboards/common.py b/webinterface/dashboards/common.py new file mode 100644 index 00000000..f4eae329 --- /dev/null +++ b/webinterface/dashboards/common.py @@ -0,0 +1,7 @@ +from decoRouter import Router as decoRouter +from starlette.responses import RedirectResponse + +router = decoRouter() +@router.get("/") +async def index(request): + return RedirectResponse(url="tests") \ No newline at end of file diff --git a/webinterface/dashboards/query.py b/webinterface/dashboards/query.py new file mode 100644 index 00000000..e27f0740 --- /dev/null +++ b/webinterface/dashboards/query.py @@ -0,0 +1,77 @@ + +from webinterface.query import SimpleDicomClient +# Standard python includes +from datetime import datetime + +# Starlette-related includes +from starlette.authentication import requires + +# App-specific includes +from common.constants import mercure_defs +from webinterface.common import templates +import common.config as config +from starlette.responses import PlainTextResponse, JSONResponse +from webinterface.common import worker_queue +from rq import get_current_job + +from .common import router +logger = config.get_logger() + +def test_job(*,accession, node): + config.read_config() + c = SimpleDicomClient(node.ip, node.port, node.aet_target, config.mercure.incoming_folder) + for identifier in c.getscu(accession): + job = get_current_job() + job.meta['failed'] = identifier.NumberOfFailedSuboperations + job.meta['remaining'] = identifier.NumberOfRemainingSuboperations + job.meta['completed'] = identifier.NumberOfCompletedSuboperations + job.save_meta() + return "Complete" + +@router.post("/query") +@requires(["authenticated", "admin"], redirect="login") +async def query_post(request): + form = await request.form() + + for n in config.mercure.dicom_retrieve.dicom_nodes: + if n.name == form.get("dicom_node"): + node = n + break + + worker_queue.enqueue_call(test_job, kwargs=dict(accession=form.get("accession"), node=node), timeout='10m', result_ttl=-1) + return PlainTextResponse() + +@router.get("/query/jobs") +@requires(["authenticated", "admin"], redirect="login") +async def query_jobs(request): + registries = [ + worker_queue.started_job_registry, # Returns StartedJobRegistry + worker_queue.deferred_job_registry, # Returns DeferredJobRegistry + worker_queue.finished_job_registry, # Returns FinishedJobRegistry + worker_queue.failed_job_registry, # Returns FailedJobRegistry + worker_queue.scheduled_job_registry, # Returns ScheduledJobRegistry + ] + job_info = [] + for r in registries: + for j_id in r.get_job_ids(): + job = worker_queue.fetch_job(j_id) + job_info.append(dict(id=j_id, + status=job.get_status(), + parameters=dict(accession=job.kwargs.get('accession','')), + enqueued_at=1000*datetime.timestamp(job.enqueued_at), + result=job.result, + meta=job.meta)) + return JSONResponse(dict(data=job_info)) + # return PlainTextResponse(",".join([str(j) for j in all_jobs])) + +@router.get("/query") +@requires(["authenticated", "admin"], redirect="login") +async def query(request): + template = "dashboards/query.html" + context = { + "request": request, + + "dicom_nodes": config.mercure.dicom_retrieve.dicom_nodes, + "page": "query", + } + return templates.TemplateResponse(template, context) \ No newline at end of file diff --git a/webinterface/dashboards/simple.py b/webinterface/dashboards/simple.py new file mode 100644 index 
00000000..c1a2ad47 --- /dev/null +++ b/webinterface/dashboards/simple.py @@ -0,0 +1,32 @@ +from .common import router +from starlette.authentication import requires + +# App-specific includes +from common.constants import mercure_defs +from webinterface.common import get_user_information, templates +import common.config as config +logger = config.get_logger() +from .common import router + +@router.get("/tasks") +@requires("authenticated", redirect="login") +async def tasks(request): + template = "dashboards/tasks.html" + context = { + "request": request, + + "page": "tasks", + } + return templates.TemplateResponse(template, context) + + +@router.get("/tests") +@requires(["authenticated", "admin"], redirect="login") +async def tests(request): + template = "dashboards/tests.html" + context = { + "request": request, + + "page": "tests", + } + return templates.TemplateResponse(template, context) \ No newline at end of file diff --git a/webinterface/modules.py b/webinterface/modules.py index 34047fc8..fdf89644 100755 --- a/webinterface/modules.py +++ b/webinterface/modules.py @@ -101,12 +101,11 @@ async def show_modules(request): template = "modules.html" context = { "request": request, - "mercure_version": mercure_defs.VERSION, + "page": "modules", "modules": config.mercure.modules, "used_modules": used_modules, } - context.update(get_user_information(request)) return templates.TemplateResponse(template, context) @@ -204,7 +203,7 @@ async def edit_module(request): template = "modules_edit.html" context = { "request": request, - "mercure_version": mercure_defs.VERSION, + "page": "modules", "module": config.mercure.modules[module], "module_name": module, @@ -212,7 +211,6 @@ async def edit_module(request): "runtime": runtime, "support_root_modules": config.mercure.support_root_modules, } - context.update(get_user_information(request)) return templates.TemplateResponse(template, context) diff --git a/webinterface/query.py b/webinterface/query.py new file mode 100644 index 00000000..fa1077e2 --- /dev/null +++ b/webinterface/query.py @@ -0,0 +1,236 @@ +import os +import re +from pynetdicom import ( + AE, + QueryRetrievePresentationContexts, BasicWorklistManagementPresentationContexts, UnifiedProcedurePresentationContexts, + build_role, + evt, + StoragePresentationContexts + ) +from pynetdicom.sop_class import StudyRootQueryRetrieveInformationModelFind +from pynetdicom.apps.common import create_dataset +from pynetdicom._globals import DEFAULT_MAX_LENGTH +from pynetdicom.pdu_primitives import SOPClassExtendedNegotiation +from pynetdicom.sop_class import ( + PatientRootQueryRetrieveInformationModelGet, + StudyRootQueryRetrieveInformationModelGet, + PatientStudyOnlyQueryRetrieveInformationModelGet, + EncapsulatedSTLStorage, + EncapsulatedOBJStorage, + EncapsulatedMTLStorage, +) +from pydicom.uid import DeflatedExplicitVRLittleEndian +from pydicom import Dataset +import sys +import subprocess + + +class DicomClientCouldNotAssociate(Exception): + pass + +class DicomClientCouldNotFind(Exception): + pass + +class DicomClientBadStatus(Exception): + pass + +SOP_CLASS_PREFIXES = { + "1.2.840.10008.5.1.4.1.1.2": ("CT", "CT Image Storage"), + "1.2.840.10008.5.1.4.1.1.2.1": ("CTE", "Enhanced CT Image Storage"), + "1.2.840.10008.5.1.4.1.1.4": ("MR", "MR Image Storage"), + "1.2.840.10008.5.1.4.1.1.4.1": ("MRE", "Enhanced MR Image Storage"), + "1.2.840.10008.5.1.4.1.1.128": ("PT", "Positron Emission Tomography Image Storage"), + "1.2.840.10008.5.1.4.1.1.130": ("PTE", "Enhanced PET Image Storage"), + 
"1.2.840.10008.5.1.4.1.1.481.1": ("RI", "RT Image Storage"), + "1.2.840.10008.5.1.4.1.1.481.2": ("RD", "RT Dose Storage"), + "1.2.840.10008.5.1.4.1.1.481.5": ("RP", "RT Plan Storage"), + "1.2.840.10008.5.1.4.1.1.481.3": ("RS", "RT Structure Set Storage"), + "1.2.840.10008.5.1.4.1.1.1": ("CR", "Computed Radiography Image Storage"), + "1.2.840.10008.5.1.4.1.1.6.1": ("US", "Ultrasound Image Storage"), + "1.2.840.10008.5.1.4.1.1.6.2": ("USE", "Enhanced US Volume Storage"), + "1.2.840.10008.5.1.4.1.1.12.1": ("XA", "X-Ray Angiographic Image Storage"), + "1.2.840.10008.5.1.4.1.1.12.1.1": ("XAE", "Enhanced XA Image Storage"), + "1.2.840.10008.5.1.4.1.1.20": ("NM", "Nuclear Medicine Image Storage"), + "1.2.840.10008.5.1.4.1.1.7": ("SC", "Secondary Capture Image Storage"), +} +class SimpleDicomClient(): + host: str + port: int + called_aet: str + output_dir: str + def __init__(self, host, port, called_aet, out_dir): + self.host = host + self.port = port + self.called_aet = called_aet + self.output_dir = out_dir + + def handle_store(self, event): + try: + ds = event.dataset + # Remove any Group 0x0002 elements that may have been included + ds = ds[0x00030000:] + except Exception as exc: + print(exc) + return 0x210 + try: + sop_class = ds.SOPClassUID + # sanitize filename by replacing all illegal characters with underscores + sop_instance = re.sub(r"[^\d.]", "_", ds.SOPInstanceUID) + except Exception as exc: + print( + "Unable to decode the received dataset or missing 'SOP Class " + "UID' and/or 'SOP Instance UID' elements" + ) + print(exc) + # Unable to decode dataset + return 0xC210 + + try: + # Get the elements we need + mode_prefix = SOP_CLASS_PREFIXES[sop_class][0] + except KeyError: + mode_prefix = "UN" + + filename = f"{self.output_dir}/{mode_prefix}.{sop_instance}" + print(f"Storing DICOM file: {filename}") + + status_ds = Dataset() + status_ds.Status = 0x0000 + try: + if event.context.transfer_syntax == DeflatedExplicitVRLittleEndian: + # Workaround for pydicom issue #1086 + with open(filename, "wb") as f: + f.write(event.encoded_dataset()) + else: + # We use `write_like_original=False` to ensure that a compliant + # File Meta Information Header is written + ds.save_as(filename, write_like_original=False) + + status_ds.Status = 0x0000 # Success + except OSError as exc: + print("Could not write file to specified directory:") + print(f" {os.path.dirname(filename)}") + print(exc) + # Failed - Out of Resources - OSError + status_ds.Status = 0xA700 + except Exception as exc: + print("Could not write file to specified directory:") + print(f" {os.path.dirname(filename)}") + print(exc) + # Failed - Out of Resources - Miscellaneous error + status_ds.Status = 0xA701 + + subprocess.run(["/opt/mercure/app/bin/ubuntu22.04/getdcmtags", filename, self.called_aet, "MERCURE"]) + return status_ds + + + def getscu(self, accession_number): + # Exclude these SOP Classes + _exclusion = [ + EncapsulatedSTLStorage, + EncapsulatedOBJStorage, + EncapsulatedMTLStorage, + ] + store_contexts = [ + cx for cx in StoragePresentationContexts if cx.abstract_syntax not in _exclusion + ] + ae = AE(ae_title="MERCURE") + # Create application entity + # Binding to port 0 lets the OS pick an available port + ae.acse_timeout = 30 + ae.dimse_timeout = 30 + ae.network_timeout = 30 + ae.add_requested_context(PatientRootQueryRetrieveInformationModelGet) + ae.add_requested_context(StudyRootQueryRetrieveInformationModelGet) + ae.add_requested_context(PatientStudyOnlyQueryRetrieveInformationModelGet) + ext_neg = [] + for cx in 
store_contexts: + ae.add_requested_context(cx.abstract_syntax) + # Add SCP/SCU Role Selection Negotiation to the extended negotiation + # We want to act as a Storage SCP + ext_neg.append(build_role(cx.abstract_syntax, scp_role=True)) + query_model = StudyRootQueryRetrieveInformationModelGet + assoc = ae.associate( + self.host, self.port, + ae_title=self.called_aet, + ext_neg=ext_neg, + evt_handlers=[(evt.EVT_C_STORE, self.handle_store, [])], + max_pdu=0, + ) + if not assoc.is_established: + raise DicomClientCouldNotAssociate() + # Send query + + ds = Dataset() + ds.QueryRetrieveLevel = 'STUDY' + ds.AccessionNumber = accession_number + + responses = assoc.send_c_get(ds, query_model) + success = False + for status, rsp_identifier in responses: + # If `status.Status` is one of the 'Pending' statuses then + # `rsp_identifier` is the C-GET response's Identifier dataset + if not status: + raise DicomClientBadStatus() + + if status.Status in [0xFF00, 0xFF01]: + yield status + success = True + if not success: + raise DicomClientCouldNotFind() + + assoc.release() + + def findscu(self,accession_number): + # Create application entity + ae = AE(ae_title=calling_aet) + + # Add a requested presentation context + # ae.add_requested_context(StudyRootQueryRetrieveInformationModelFind) + ae.requested_contexts = QueryRetrievePresentationContexts + # + BasicWorklistManagementPresentationContexts + # + UnifiedProcedurePresentationContexts ) + + # Associate with the peer AE + assoc = ae.associate(self.host, self.port, ae_title=self.called_aet, max_pdu=0, ext_neg=[]) + + ds = Dataset() + ds.QueryRetrieveLevel = 'STUDY' + ds.AccessionNumber = accession_number + if not assoc.is_established: + raise DicomClientCouldNotAssociate() + + try: + responses = assoc.send_c_find( + ds, + StudyRootQueryRetrieveInformationModelFind + ) + + for (status, identifier) in responses: + if not status: + print('Connection timed out, was aborted or received invalid response') + break + + if status.Status in [0xFF00, 0xFF01]: + # print('C-FIND query status: 0x{0:04x}'.format(status.Status)) + return identifier + # elif status.Status == 0x0000: + # print("Success") + # break + raise DicomClientCouldNotFind() + finally: + assoc.release() + +if __name__ == "__main__": + # Replace these variables with your actual values + remote_host = sys.argv[1] + remote_port = int(sys.argv[2]) + calling_aet = sys.argv[3] + called_aet = sys.argv[4] + accession_number = sys.argv[5] + + print(f"{remote_host=} {remote_port=} {calling_aet=} {called_aet=} {accession_number=}") + c = SimpleDicomClient(remote_host, remote_port, called_aet, "/tmp/test-move") + # study_uid = c.get_study_uid(accession_number) + # print(study_uid) + c.getscu(accession_number) \ No newline at end of file diff --git a/webinterface/queue.py b/webinterface/queue.py index b104134c..de92bcd1 100755 --- a/webinterface/queue.py +++ b/webinterface/queue.py @@ -57,12 +57,10 @@ async def show_queues(request): template = "queue.html" context = { "request": request, - "mercure_version": mercure_defs.VERSION, "page": "queue", "processing_suspended": processing_suspended, "routing_suspended": routing_suspended, } - context.update(get_user_information(request)) return templates.TemplateResponse(template, context) diff --git a/webinterface/rules.py b/webinterface/rules.py index 2d76bbfd..39c011b5 100755 --- a/webinterface/rules.py +++ b/webinterface/rules.py @@ -47,11 +47,9 @@ async def show_rules(request) -> Response: template = "rules.html" context = { "request": request, - "mercure_version": 
mercure_defs.VERSION, "page": "rules", "rules": config.mercure.rules, } - context.update(get_user_information(request)) return templates.TemplateResponse(template, context) @@ -112,7 +110,6 @@ async def rules_edit(request) -> Response: context = { "request": request, - "mercure_version": mercure_defs.VERSION, "page": "rules", "rules": config.mercure.rules, "targets": config.mercure.targets, @@ -123,7 +120,6 @@ async def rules_edit(request) -> Response: "processing_settings": settings_string, "process_runner": config.mercure.process_runner } - context.update(get_user_information(request)) template = "rules_edit.html" return templates.TemplateResponse(template, context) diff --git a/webinterface/targets.py b/webinterface/targets.py index bf78ceb6..9dddb525 100755 --- a/webinterface/targets.py +++ b/webinterface/targets.py @@ -50,7 +50,6 @@ async def show_targets(request) -> Response: template = "targets.html" context = { "request": request, - "mercure_version": mercure_defs.VERSION, "page": "targets", "targets": config.mercure.targets, "used_targets": used_targets, @@ -104,7 +103,6 @@ async def targets_edit(request) -> Response: template = "targets_edit.html" context = { "request": request, - "mercure_version": mercure_defs.VERSION, "page": "targets", "targets": config.mercure.targets, "edittarget": edittarget, diff --git a/webinterface/templates/dashboards/dashboards.html b/webinterface/templates/dashboards/dashboards.html index 2cb4c137..afe990b0 100644 --- a/webinterface/templates/dashboards/dashboards.html +++ b/webinterface/templates/dashboards/dashboards.html @@ -7,6 +7,7 @@ diff --git a/webinterface/templates/dashboards/query.html b/webinterface/templates/dashboards/query.html new file mode 100644 index 00000000..48756c04 --- /dev/null +++ b/webinterface/templates/dashboards/query.html @@ -0,0 +1,117 @@ +{% extends "dashboards/dashboards.html" %} + +{% block title %}Query{% endblock %} + +{% block extra_head %} + + +{% endblock %} + +{% block dashboard_content %} +
[query.html, dashboard body: a "DICOM Query" panel with a submission form (DICOM node selector, accession number field, Query button posting to the query endpoint) and a jobs table with columns id, status, enqueued_at, accession, result, progress, driven by a DataTables script that polls query/jobs — markup not preserved in this excerpt]
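The DICOM node selector in this form is filled from the new config.mercure.dicom_retrieve section that common/types.py introduces above. A rough sketch of that configuration built with the new pydantic models — the node name, address, and AE titles below are placeholders, not shipped defaults:

from common.types import DicomNode, DicomRetrieveConfig

# Hypothetical PACS entry; substitute the node you actually want to query.
retrieve_config = DicomRetrieveConfig(
    dicom_nodes=[
        DicomNode(name="main-pacs", ip="10.0.0.5", port=104,
                  aet_target="PACS", aet_source="MERCURE"),
    ]
)

# The same information as it would appear in mercure.json:
# "dicom_retrieve": {
#     "dicom_nodes": [
#         {"name": "main-pacs", "ip": "10.0.0.5", "port": 104,
#          "aet_target": "PACS", "aet_source": "MERCURE"}
#     ]
# }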
+ +
+ +{% endblock %} \ No newline at end of file diff --git a/webinterface/users.py b/webinterface/users.py index 1d70f57f..f7b7276b 100755 --- a/webinterface/users.py +++ b/webinterface/users.py @@ -187,8 +187,7 @@ async def show_users(request) -> Response: return PlainTextResponse("Configuration is being updated. Try again in a minute.") template = "users.html" - context = {"request": request, "mercure_version": mercure_defs.VERSION, "page": "users", "users": users_list} - context.update(get_user_information(request)) + context = {"request": request, "page": "users", "users": users_list} return templates.TemplateResponse(template, context) @@ -237,12 +236,10 @@ async def users_edit(request) -> Response: template = "users_edit.html" context = { "request": request, - "mercure_version": mercure_defs.VERSION, "page": "users", "edituser": edituser, "edituser_info": users_list[edituser], } - context.update(get_user_information(request)) return templates.TemplateResponse(template, context) From 3928935b6812a8d3dc3037362dff4a1eb15c6770 Mon Sep 17 00:00:00 2001 From: Roy Wiggins Date: Fri, 31 May 2024 22:41:35 +0000 Subject: [PATCH 02/42] beginner support for batch process --- requirements.in | 10 +- requirements.txt | 24 ++- webinterface/common.py | 7 +- webinterface/dashboards/query.py | 146 ++++++++++++++++-- webinterface/templates/dashboards/query.html | 36 ++++- .../dashboards/query_job_fragment.html | 29 ++++ 6 files changed, 227 insertions(+), 25 deletions(-) create mode 100644 webinterface/templates/dashboards/query_job_fragment.html diff --git a/requirements.in b/requirements.in index bbfe31af..ca789b3e 100644 --- a/requirements.in +++ b/requirements.in @@ -57,8 +57,10 @@ pillow >= 10.0.1 dicomweb-client boto3 freezegun -certifi>=2023.07.22 -future>=0.18.3 -lxml>=4.9.1 +certifi >= 2023.07.22 +future >= 0.18.3 +lxml >= 4.9.1 pyxnat -urllib3>=1.26.18 \ No newline at end of file +urllib3 >= 1.26.18 +rq ~= 1.16.2 +rq-scheduler ~= 0.13.1 \ No newline at end of file diff --git a/requirements.txt b/requirements.txt index c1c269d9..66a94595 100644 --- a/requirements.txt +++ b/requirements.txt @@ -2,7 +2,7 @@ # This file is autogenerated by pip-compile with Python 3.10 # by the following command: # -# pip-compile requirements.in +# pip-compile # aiofiles==23.2.1 # via -r requirements.in @@ -25,6 +25,7 @@ async-timeout==4.0.3 # aiohttp # aiopg # asyncpg + # redis asyncpg==0.29.0 # via -r requirements.in attrs==23.2.0 @@ -40,11 +41,14 @@ botocore==1.34.40 certifi==2024.2.2 # via # -r requirements.in + # influxdb-client # requests charset-normalizer==3.3.2 # via requests click==8.1.7 - # via uvicorn + # via + # rq + # uvicorn daiquiri==3.2.5.1 # via -r requirements.in databases[aiopg]==0.8.0 @@ -86,10 +90,10 @@ idna==3.6 # yarl imagesize==1.4.1 # via sphinx +influxdb-client==1.38.0 + # via -r requirements.in iniconfig==2.0.0 # via pytest -influxdb_client==1.38.0 - # via -r requirements.in itsdangerous==2.1.2 # via -r requirements.in jinja2==3.1.3 @@ -164,6 +168,7 @@ python-dateutil==2.8.2 # via # botocore # freezegun + # influxdb-client python-json-logger==2.0.7 # via daiquiri python-multipart==0.0.9 @@ -172,6 +177,10 @@ python-nomad==2.0.0 # via -r requirements.in pyxnat==1.6.2 # via -r requirements.in +reactivex==4.0.4 + # via influxdb-client +redis==5.0.4 + # via rq requests==2.31.0 # via # dicomweb-client @@ -181,6 +190,8 @@ requests==2.31.0 # sphinx retrying==1.3.4 # via dicomweb-client +rq==1.16.2 + # via -r requirements.in s3transfer==0.10.0 # via boto3 six==1.16.0 @@ -244,11 +255,13 @@ 
typing-extensions==4.9.0 # asgiref # mypy # pydantic + # reactivex urllib3==2.0.7 # via # -r requirements.in # botocore # docker + # influxdb-client # requests # types-requests uvicorn==0.16.0 @@ -259,3 +272,6 @@ wheel==0.42.0 # via -r requirements.in yarl==1.9.4 # via aiohttp + +# The following packages are considered to be unsafe in a requirements file: +# setuptools diff --git a/webinterface/common.py b/webinterface/common.py index 60e65adb..25a35efd 100755 --- a/webinterface/common.py +++ b/webinterface/common.py @@ -14,10 +14,11 @@ from starlette.templating import Jinja2Templates from common.constants import mercure_defs +from rq_scheduler import Scheduler - - -worker_queue = Queue(connection=Redis()) +redis = Redis() +worker_queue = Queue(connection=redis) +worker_scheduler = Scheduler(queue=worker_queue, connection=worker_queue.connection) def get_user_information(request) -> dict: """Returns dictionary of values that should always be passed to the templates when the user is logged in.""" diff --git a/webinterface/dashboards/query.py b/webinterface/dashboards/query.py index e27f0740..8dd692de 100644 --- a/webinterface/dashboards/query.py +++ b/webinterface/dashboards/query.py @@ -2,7 +2,7 @@ from webinterface.query import SimpleDicomClient # Standard python includes from datetime import datetime - +import time, random # Starlette-related includes from starlette.authentication import requires @@ -11,34 +11,139 @@ from webinterface.common import templates import common.config as config from starlette.responses import PlainTextResponse, JSONResponse -from webinterface.common import worker_queue +from webinterface.common import worker_queue, redis +from rq import Connection from rq import get_current_job - +from rq.job import Job from .common import router logger = config.get_logger() -def test_job(*,accession, node): +def query_job(*,accession, node): config.read_config() c = SimpleDicomClient(node.ip, node.port, node.aet_target, config.mercure.incoming_folder) + job = get_current_job() + job.meta["started"] = 1 + job.save_meta() for identifier in c.getscu(accession): - job = get_current_job() job.meta['failed'] = identifier.NumberOfFailedSuboperations job.meta['remaining'] = identifier.NumberOfRemainingSuboperations job.meta['completed'] = identifier.NumberOfCompletedSuboperations + if not job.meta.get('total', False): + job.meta['total'] = identifier.NumberOfCompletedSuboperations + identifier.NumberOfRemainingSuboperations + job.meta["started"] += 1 job.save_meta() return "Complete" +def dummy_job(*,accession, node): + total_time = 3 # Total time for the job in seconds (1 minute) + update_interval = 1 # Interval between updates in seconds + + start_time = time.monotonic() + job = get_current_job() + if job.meta.get('parent'): + job_parent = worker_queue.fetch_job(job.meta['parent']) + else: + job_parent = None + # failed = 0 + remaining = total_time // update_interval + completed = 0 + print(accession) + if job_parent: + job_parent.meta['started'] = job_parent.meta.get('started',0) + 1 + job_parent.save_meta() + + job.meta['started'] = 1 + job.meta['total'] = remaining + job.meta['progress'] = f"0 / {job.meta['total']}" + job.save_meta() + while (time.monotonic() - start_time) < total_time: + time.sleep(update_interval) # Sleep for the interval duration + remaining -= 1 + completed += 1 + + # job.meta['failed'] = failed + job.meta['remaining'] = remaining + job.meta['completed'] = completed + job.meta['progress'] = f"{completed} / {job.meta['total']}" + print(job.meta['progress']) + 
job.save_meta() # Save the updated meta data to the job + + if job_parent: + job_parent.meta['completed'] += 1 + job_parent.meta['progress'] = f"{job_parent.meta['completed'] } / {job_parent.meta['total']}" + + job_parent.save_meta() + return "Job complete" + +def batch_job(*, accessions, subjobs): + print(subjobs) + return "Batch complete" + +def monitor_job(): + print("monitoring") + +@router.get("/query/job_info") +@requires(["authenticated", "admin"], redirect="login") +async def get_job_info(request): + job_id = request.query_params['id'] + job = worker_queue.fetch_job(job_id) + if not job: + return JSONResponse({'error': 'Job not found'}, status_code=404) + + subjob_info = [] + for job_id in job.kwargs.get('subjobs',[]): + subjob = worker_queue.fetch_job(job_id) + if subjob: + subjob_info.append({'id': subjob.get_id(), + 'ended_at': subjob.ended_at.isoformat().split('.')[0] if subjob.ended_at else "", + 'created_at_dt':subjob.created_at, + 'accession': subjob.kwargs['accession'], + 'progress': subjob.meta.get('progress'), + 'status': subjob.get_status()}) + subjob_info = sorted(subjob_info, key=lambda x:x['created_at_dt']) + return templates.TemplateResponse("dashboards/query_job_fragment.html", {"request":request,"subjob_info":subjob_info}) + @router.post("/query") @requires(["authenticated", "admin"], redirect="login") -async def query_post(request): +async def query_post_batch(request): + """ + Starts a new query job for the given accession number and DICOM node. + """ form = await request.form() + for n in config.mercure.dicom_retrieve.dicom_nodes: + if n.name == form.get("dicom_node"): + node = n + break + random_accessions = ["".join(random.choices([str(i) for i in range(10)], k=10)) for _ in range(5)] + jobs = [] + with Connection(redis): + for accession in random_accessions: + job = Job.create(dummy_job, kwargs=dict(accession=accession, node=node), timeout='30m', result_ttl=-1, meta=dict(type="get_accession_batch",parent=None)) + jobs.append(job) + full_job = Job.create(batch_job, kwargs=dict(accessions=random_accessions, subjobs=[j.id for j in jobs]), timeout=-1, result_ttl=-1, meta=dict(type="batch", started=0, completed=0, total=len(jobs)), depends_on=[j.id for j in jobs]) + for j in jobs: + j.meta["parent"] = full_job.id + + for j in jobs: + worker_queue.enqueue_job(j) + worker_queue.enqueue_job(full_job) + # worker_scheduler.schedule(scheduled_time=datetime.utcnow(), func=monitor_job, interval=10, repeat=10, result_ttl=-1) + return PlainTextResponse() + +@router.post("/query_single") +@requires(["authenticated", "admin"], redirect="login") +async def query_post(request): + """ + Starts a new query job for the given accession number and DICOM node. 
+ """ + form = await request.form() for n in config.mercure.dicom_retrieve.dicom_nodes: if n.name == form.get("dicom_node"): node = n break - worker_queue.enqueue_call(test_job, kwargs=dict(accession=form.get("accession"), node=node), timeout='10m', result_ttl=-1) + worker_queue.enqueue_call(query_job, kwargs=dict(accession=form.get("accession"), node=node), timeout='30m', result_ttl=-1, meta=dict(type="get_accession_single")) return PlainTextResponse() @router.get("/query/jobs") @@ -55,12 +160,33 @@ async def query_jobs(request): for r in registries: for j_id in r.get_job_ids(): job = worker_queue.fetch_job(j_id) - job_info.append(dict(id=j_id, + if job.meta.get('type') != 'batch': + continue + job_dict = dict(id=j_id, status=job.get_status(), parameters=dict(accession=job.kwargs.get('accession','')), - enqueued_at=1000*datetime.timestamp(job.enqueued_at), + created_at=1000*datetime.timestamp(job.created_at) if job.created_at else "", + enqueued_at=1000*datetime.timestamp(job.enqueued_at) if job.enqueued_at else "", result=job.result, - meta=job.meta)) + meta=job.meta, + progress="") + # if job.meta.get('completed') and job.meta.get('remaining'): + # job_dict["progress"] = f"{job.meta.get('completed')} / {job.meta.get('completed') + job.meta.get('remaining')}" + # if job.meta.get('type',None) == "batch": + n_started = job.meta.get('started',0) + n_completed = job.meta.get('completed',0) + n_total = job.meta.get('total',0) + + if job_dict["status"] == "finished": + job_dict["progress"] = f"{n_total} / {n_total}" + elif job_dict["status"] in ("deferred","started"): + job_dict["progress"] = f"{n_completed} / {n_total}" + if 0 < n_started < n_total: + job_dict["status"] = "running" + elif n_completed == n_total: + job_dict["status"] = "finishing" + + job_info.append(job_dict) return JSONResponse(dict(data=job_info)) # return PlainTextResponse(",".join([str(j) for j in all_jobs])) diff --git a/webinterface/templates/dashboards/query.html b/webinterface/templates/dashboards/query.html index 48756c04..f595df46 100644 --- a/webinterface/templates/dashboards/query.html +++ b/webinterface/templates/dashboards/query.html @@ -68,9 +68,11 @@

DICOM Query

+ + - + @@ -93,14 +95,22 @@

DICOM Query

ajax: "query/jobs", deferRender: true, columns: [ + { + className: 'dt-control', + orderable: false, + data: null, + defaultContent: '' + }, { data: 'id' }, + { data: 'meta', render: data => data["type"]? data["type"]:"" }, { data: 'status' }, - { data: 'enqueued_at', render: data => `${data}`+new Date(data).toLocaleString("en-US")}, + { data: 'created_at', render: data => `${data || Date.now() }`+(data? new Date(data).toLocaleString("en-US"):"")}, { data: 'parameters', render: data => data["accession"] || ""}, { data: 'result' }, - { data: 'meta', render: data => data["completed"]?`${data["completed"]}/${data["remaining"]+data["completed"]}`:"" }, + { data: 'progress'}, ], select: { + selector:'td:not(:first-child)', style: 'os' }, language: { @@ -108,10 +118,28 @@

DICOM Query

}, // filter: true, buttons: [], - order: [[2, 'desc']], + order: [[4, 'desc']], initComplete: function() { } }); + window.datatable.on('click', 'td.dt-control', function (e) { + let tr = e.target.closest('tr'); + let row = window.datatable.row(tr); + + if (row.child.isShown()) { + // This row is already open - close it + row.child.hide(); + } + else { + // Open this row + fetch("query/job_info?id="+row.data().id, {method: "GET"} + ).then( + response => response.text() + ).then(data=>{ + row.child(data).show(); + }); + } + }); }); {% endblock %} \ No newline at end of file diff --git a/webinterface/templates/dashboards/query_job_fragment.html b/webinterface/templates/dashboards/query_job_fragment.html new file mode 100644 index 00000000..36314c81 --- /dev/null +++ b/webinterface/templates/dashboards/query_job_fragment.html @@ -0,0 +1,29 @@ +
id type status enqueued_at created_at accession result progress
+ + + + + + + + + + {% for job in subjob_info %} + + + + + + + + {% endfor %} +
+ + Accession + + Ended at + + Status + + Progress +
{{job['accession']}}{{job['ended_at'] or ''}}{{job['status']}}{{job['progress'] or ''}}
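The fragment above renders the per-accession sub-jobs of one batch. The batching itself rests on RQ job dependencies: each sub-job bumps a counter in its parent's meta, and the parent job only runs once every sub-job has finished. A condensed sketch of that pattern, assuming a local Redis and rq ~= 1.16 (fetch_accession and collect_batch are illustrative names, not mercure functions):

from redis import Redis
from rq import Queue, get_current_job
from rq.job import Job

redis = Redis()
queue = Queue(connection=redis)

def fetch_accession(*, accession):
    # Sub-job: do the retrieval work, then bump the parent's completion counter.
    job = get_current_job()
    parent = queue.fetch_job(job.meta["parent"]) if job.meta.get("parent") else None
    # ... perform the C-GET for `accession` here ...
    if parent:
        parent.get_meta()               # refresh from Redis before updating
        parent.meta["completed"] += 1
        parent.save_meta()
    return f"{accession} done"

def collect_batch(*, accessions, subjobs):
    # Parent job: only runs after all sub-jobs finished, thanks to depends_on below.
    return f"collected {len(accessions)} accessions"

def enqueue_batch(accessions):
    subjobs = [Job.create(fetch_accession, kwargs=dict(accession=a), connection=redis,
                          result_ttl=-1, meta=dict(parent=None))
               for a in accessions]
    parent = Job.create(collect_batch, connection=redis, result_ttl=-1,
                        kwargs=dict(accessions=accessions, subjobs=[j.id for j in subjobs]),
                        meta=dict(completed=0, total=len(subjobs)),
                        depends_on=[j.id for j in subjobs])
    for j in subjobs:
        j.meta["parent"] = parent.id    # link child -> parent before enqueueing
        queue.enqueue_job(j)
    queue.enqueue_job(parent)
    return parent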
\ No newline at end of file From 0f753e0db5feac2c0354d9ab27016d63835b6185 Mon Sep 17 00:00:00 2001 From: Roy Wiggins Date: Fri, 31 May 2024 23:23:29 +0000 Subject: [PATCH 03/42] create dummy files --- webinterface/dashboards/query.py | 15 ++++++++++++--- 1 file changed, 12 insertions(+), 3 deletions(-) diff --git a/webinterface/dashboards/query.py b/webinterface/dashboards/query.py index 8dd692de..81170039 100644 --- a/webinterface/dashboards/query.py +++ b/webinterface/dashboards/query.py @@ -1,4 +1,6 @@ +from pathlib import Path +import shutil from webinterface.query import SimpleDicomClient # Standard python includes from datetime import datetime @@ -34,7 +36,8 @@ def query_job(*,accession, node): job.save_meta() return "Complete" -def dummy_job(*,accession, node): +def dummy_job(*,accession, node, path): + Path(path).mkdir(parents=True, exist_ok=True) total_time = 3 # Total time for the job in seconds (1 minute) update_interval = 1 # Interval between updates in seconds @@ -58,6 +61,7 @@ def dummy_job(*,accession, node): job.save_meta() while (time.monotonic() - start_time) < total_time: time.sleep(update_interval) # Sleep for the interval duration + (Path(path) / f"dummy{completed}_{job.id}.dcm").touch() remaining -= 1 completed += 1 @@ -75,8 +79,10 @@ def dummy_job(*,accession, node): job_parent.save_meta() return "Job complete" -def batch_job(*, accessions, subjobs): - print(subjobs) +def batch_job(*, accessions, subjobs, path): + for p in Path(path).glob("**/*.dcm"): + shutil.move(p, "/opt/mercure/data/incoming") + shutil.rmtree(path) return "Batch complete" def monitor_job(): @@ -123,6 +129,9 @@ async def query_post_batch(request): full_job = Job.create(batch_job, kwargs=dict(accessions=random_accessions, subjobs=[j.id for j in jobs]), timeout=-1, result_ttl=-1, meta=dict(type="batch", started=0, completed=0, total=len(jobs)), depends_on=[j.id for j in jobs]) for j in jobs: j.meta["parent"] = full_job.id + j.kwargs["path"] = f"/opt/mercure/data/query/job_dirs/{full_job.id}/{j.kwargs['accession']}" + full_job.kwargs["path"] = Path(f"/opt/mercure/data/query/job_dirs/{full_job.id}") + for j in jobs: worker_queue.enqueue_job(j) From e3a86eda69392f3c00c0a471d53603c65c4978d3 Mon Sep 17 00:00:00 2001 From: Roy Wiggins Date: Fri, 7 Jun 2024 22:54:17 +0000 Subject: [PATCH 04/42] - pause/resume jobs - redirect results to folder --- common/types.py | 7 +- webinterface/common.py | 3 + webinterface/dashboards/query.py | 200 ++++++++++++++----- webinterface/templates/dashboards/query.html | 95 ++++++++- 4 files changed, 248 insertions(+), 57 deletions(-) diff --git a/common/types.py b/common/types.py index 9558db6c..aaba7738 100755 --- a/common/types.py +++ b/common/types.py @@ -185,9 +185,14 @@ class DicomNode(BaseModel): aet_target: str aet_source: Optional[str] = "" +class DicomDestination(BaseModel): + name: str + path: str + class DicomRetrieveConfig(BaseModel): dicom_nodes: List[DicomNode] = [] - + destination_folders: List[DicomDestination] = [] + class Config(BaseModel, Compat): appliance_name: str port: int diff --git a/webinterface/common.py b/webinterface/common.py index 25a35efd..d0692a89 100755 --- a/webinterface/common.py +++ b/webinterface/common.py @@ -17,6 +17,9 @@ from rq_scheduler import Scheduler redis = Redis() + + + worker_queue = Queue(connection=redis) worker_scheduler = Scheduler(queue=worker_queue, connection=worker_queue.connection) diff --git a/webinterface/dashboards/query.py b/webinterface/dashboards/query.py index 81170039..eca892da 100644 --- 
a/webinterface/dashboards/query.py +++ b/webinterface/dashboards/query.py @@ -20,6 +20,8 @@ from .common import router logger = config.get_logger() + + def query_job(*,accession, node): config.read_config() c = SimpleDicomClient(node.ip, node.port, node.aet_target, config.mercure.incoming_folder) @@ -36,9 +38,10 @@ def query_job(*,accession, node): job.save_meta() return "Complete" + def dummy_job(*,accession, node, path): Path(path).mkdir(parents=True, exist_ok=True) - total_time = 3 # Total time for the job in seconds (1 minute) + total_time = 10 # Total time for the job in seconds (1 minute) update_interval = 1 # Interval between updates in seconds start_time = time.monotonic() @@ -61,7 +64,10 @@ def dummy_job(*,accession, node, path): job.save_meta() while (time.monotonic() - start_time) < total_time: time.sleep(update_interval) # Sleep for the interval duration - (Path(path) / f"dummy{completed}_{job.id}.dcm").touch() + out_file = (Path(path) / f"dummy{completed}_{job.id}.dcm") + if out_file.exists(): + raise Exception(f"{out_file} exists already") + out_file.touch() remaining -= 1 completed += 1 @@ -73,21 +79,82 @@ def dummy_job(*,accession, node, path): job.save_meta() # Save the updated meta data to the job if job_parent: + job_parent.get_meta() # there is technically a race condition here... job_parent.meta['completed'] += 1 - job_parent.meta['progress'] = f"{job_parent.meta['completed'] } / {job_parent.meta['total']}" + job_parent.meta['progress'] = f"{job_parent.meta['started'] } / {job_parent.meta['completed'] } / {job_parent.meta['total']}" job_parent.save_meta() return "Job complete" -def batch_job(*, accessions, subjobs, path): - for p in Path(path).glob("**/*.dcm"): - shutil.move(p, "/opt/mercure/data/incoming") +def batch_job(*, accessions, subjobs, path, destination): + job = get_current_job() + job.save_meta() + logger.info(f"Job completing {job.id}") + logger.info(path) + if destination is None: + for p in Path(path).glob("**/*"): + if p.is_file(): + shutil.move(p, config.mercure.incoming_folder) + else: + dest_folder: Path = Path(destination) / job.id + dest_folder.mkdir() + for p in Path(path).iterdir(): + if p.is_dir(): + logger.info(f"moving {p} to {dest_folder}") + shutil.move(p, dest_folder) + shutil.rmtree(path) - return "Batch complete" + return "Job complete" + + def monitor_job(): print("monitoring") +@router.post("/query/pause_job") +@requires(["authenticated", "admin"], redirect="login") +async def pause_job(request): + job = worker_queue.fetch_job(request.query_params['id']) + if not job: + return JSONResponse({'error': 'Job not found'}, status_code=404) + if job.is_finished or job.is_failed: + return JSONResponse({'error': 'Job is already finished'}, status_code=400) + + for job_id in job.kwargs.get('subjobs',[]): + subjob = worker_queue.fetch_job(job_id) + if subjob and (subjob.is_deferred or subjob.is_queued): + subjob.meta['paused'] = True + subjob.save_meta() + subjob.cancel() + job.meta['paused'] = True + job.save_meta() + return JSONResponse({'status': 'success'}, status_code=200) + +@router.post("/query/resume_job") +@requires(["authenticated", "admin"], redirect="login") +async def resume_job(request): + job = worker_queue.fetch_job(request.query_params['id']) + if not job: + return JSONResponse({'error': 'Job not found'}, status_code=404) + if job.is_finished or job.is_failed: + return JSONResponse({'error': 'Job is already finished'}, status_code=400) + # if not job.meta.get('paused', False): + # return JSONResponse({'error': 'Job is not 
paused'}, status_code=400) + + for subjob_id in job.kwargs.get('subjobs',[]): + subjob = worker_queue.fetch_job(subjob_id) + if subjob and subjob.meta.get('paused', None): + subjob.meta['paused'] = False + subjob.save_meta() + worker_queue.canceled_job_registry.requeue(subjob_id) + # worker_queue.canceled_job_registry.remove(subjob_id) + job.get_meta() + job.meta['paused'] = False + job.save_meta() + # worker_queue.canceled_job_registry.requeue(job.id) + # worker_queue.canceled_job_registry.remove(job.id) + return JSONResponse({'status': 'success'}, status_code=200) + @router.get("/query/job_info") @requires(["authenticated", "admin"], redirect="login") async def get_job_info(request): @@ -97,17 +164,21 @@ async def get_job_info(request): return JSONResponse({'error': 'Job not found'}, status_code=404) subjob_info = [] - for job_id in job.kwargs.get('subjobs',[]): - subjob = worker_queue.fetch_job(job_id) - if subjob: - subjob_info.append({'id': subjob.get_id(), - 'ended_at': subjob.ended_at.isoformat().split('.')[0] if subjob.ended_at else "", - 'created_at_dt':subjob.created_at, - 'accession': subjob.kwargs['accession'], - 'progress': subjob.meta.get('progress'), - 'status': subjob.get_status()}) + subjobs = (worker_queue.fetch_job(job) for job in job.kwargs.get('subjobs', [])) + for subjob in subjobs: + info = {'id': subjob.get_id(), + 'ended_at': subjob.ended_at.isoformat().split('.')[0] if subjob.ended_at else "", + 'created_at_dt':subjob.created_at, + 'accession': subjob.kwargs['accession'], + 'progress': subjob.meta.get('progress'), + 'paused': subjob.meta.get('paused',False), + 'status': subjob.get_status() + } + if info['status'] == 'canceled' and info['paused']: + info['status'] = 'paused' + subjob_info.append(info) subjob_info = sorted(subjob_info, key=lambda x:x['created_at_dt']) - return templates.TemplateResponse("dashboards/query_job_fragment.html", {"request":request,"subjob_info":subjob_info}) + return templates.TemplateResponse("dashboards/query_job_fragment.html", {"request":request,"job":job,"subjob_info":subjob_info}) @router.post("/query") @requires(["authenticated", "admin"], redirect="login") @@ -120,18 +191,22 @@ async def query_post_batch(request): if n.name == form.get("dicom_node"): node = n break - random_accessions = ["".join(random.choices([str(i) for i in range(10)], k=10)) for _ in range(5)] + destination = form.get("destination") + for d in config.mercure.dicom_retrieve.destination_folders: + if d.name == destination: + destination_path = d.path + random_accessions = ["".join(random.choices([str(i) for i in range(10)], k=5)) for _ in range(3)] jobs = [] with Connection(redis): for accession in random_accessions: - job = Job.create(dummy_job, kwargs=dict(accession=accession, node=node), timeout='30m', result_ttl=-1, meta=dict(type="get_accession_batch",parent=None)) + job = Job.create(dummy_job, kwargs=dict(accession=accession, node=node), timeout='30m', result_ttl=-1, meta=dict(type="get_accession_batch",parent=None, paused=False)) jobs.append(job) - full_job = Job.create(batch_job, kwargs=dict(accessions=random_accessions, subjobs=[j.id for j in jobs]), timeout=-1, result_ttl=-1, meta=dict(type="batch", started=0, completed=0, total=len(jobs)), depends_on=[j.id for j in jobs]) + full_job = Job.create(batch_job, kwargs=dict(accessions=random_accessions, subjobs=[j.id for j in jobs], destination=destination_path), timeout=-1, result_ttl=-1, meta=dict(type="batch", started=0, paused=False,completed=0, total=len(jobs)), depends_on=[j.id for j in jobs]) for j 
in jobs: j.meta["parent"] = full_job.id j.kwargs["path"] = f"/opt/mercure/data/query/job_dirs/{full_job.id}/{j.kwargs['accession']}" full_job.kwargs["path"] = Path(f"/opt/mercure/data/query/job_dirs/{full_job.id}") - + full_job.kwargs["path"].mkdir(parents=True) for j in jobs: worker_queue.enqueue_job(j) @@ -164,38 +239,59 @@ async def query_jobs(request): worker_queue.finished_job_registry, # Returns FinishedJobRegistry worker_queue.failed_job_registry, # Returns FailedJobRegistry worker_queue.scheduled_job_registry, # Returns ScheduledJobRegistry + worker_queue.canceled_job_registry, # Returns CanceledJobRegistry ] job_info = [] - for r in registries: - for j_id in r.get_job_ids(): - job = worker_queue.fetch_job(j_id) - if job.meta.get('type') != 'batch': - continue - job_dict = dict(id=j_id, - status=job.get_status(), - parameters=dict(accession=job.kwargs.get('accession','')), - created_at=1000*datetime.timestamp(job.created_at) if job.created_at else "", - enqueued_at=1000*datetime.timestamp(job.enqueued_at) if job.enqueued_at else "", - result=job.result, - meta=job.meta, - progress="") - # if job.meta.get('completed') and job.meta.get('remaining'): - # job_dict["progress"] = f"{job.meta.get('completed')} / {job.meta.get('completed') + job.meta.get('remaining')}" - # if job.meta.get('type',None) == "batch": - n_started = job.meta.get('started',0) - n_completed = job.meta.get('completed',0) - n_total = job.meta.get('total',0) - - if job_dict["status"] == "finished": - job_dict["progress"] = f"{n_total} / {n_total}" - elif job_dict["status"] in ("deferred","started"): - job_dict["progress"] = f"{n_completed} / {n_total}" - if 0 < n_started < n_total: - job_dict["status"] = "running" - elif n_completed == n_total: - job_dict["status"] = "finishing" - - job_info.append(job_dict) + # logger.info(worker_queue.job_ids) + # for registry in registries: + job_ids = set() + for registry in registries: + for j_id in registry.get_job_ids(): + job_ids.add(j_id) + for j_id in worker_queue.job_ids: + job_ids.add(j_id) + + for j_id in job_ids: + job = worker_queue.fetch_job(j_id) + job_meta = job.get_meta() + if job_meta.get('type') != 'batch': + continue + job_dict = dict(id=j_id, + status=job.get_status(), + parameters=dict(accession=job.kwargs.get('accession','')), + created_at=1000*datetime.timestamp(job.created_at) if job.created_at else "", + enqueued_at=1000*datetime.timestamp(job.enqueued_at) if job.enqueued_at else "", + result=job.result, + meta=job_meta, + progress="") + # if job.meta.get('completed') and job.meta.get('remaining'): + # job_dict["progress"] = f"{job.meta.get('completed')} / {job.meta.get('completed') + job.meta.get('remaining')}" + # if job.meta.get('type',None) == "batch": + n_started = job_meta.get('started',0) + n_completed = job_meta.get('completed',0) + n_total = job_meta.get('total',0) + + if job_dict["status"] == "finished": + job_dict["progress"] = f"{n_total} / {n_total}" + elif job_dict["status"] in ("deferred","started", "paused", "canceled"): + job_dict["progress"] = f"{n_completed} / {n_total}" + + # if job_dict["status"] == "canceled" and + if job_dict["meta"].get('paused', False): + if n_started < n_completed: # TODO: this does not work + job_dict["status"] = "pausing" + else: + job_dict["status"] = "paused" + + if job_dict["status"] in ("deferred", "started"): + if n_started == 0: + job_dict["status"] = "waiting" + elif n_completed < n_total: + job_dict["status"] = "running" + elif n_completed == n_total: + job_dict["status"] = "finishing" + + 
job_info.append(job_dict) return JSONResponse(dict(data=job_info)) # return PlainTextResponse(",".join([str(j) for j in all_jobs])) @@ -205,7 +301,7 @@ async def query(request): template = "dashboards/query.html" context = { "request": request, - + "destination_folders": config.mercure.dicom_retrieve.destination_folders, "dicom_nodes": config.mercure.dicom_retrieve.dicom_nodes, "page": "query", } diff --git a/webinterface/templates/dashboards/query.html b/webinterface/templates/dashboards/query.html index f595df46..085cc209 100644 --- a/webinterface/templates/dashboards/query.html +++ b/webinterface/templates/dashboards/query.html @@ -44,7 +44,26 @@

DICOM Query

- +
+
+ +
+
+
+
+
+ +
+
+
+
+
@@ -59,7 +78,6 @@

DICOM Query

-
@@ -84,12 +102,45 @@

DICOM Query

+ + + +{% endblock %} + +{% block dashboard_content %} +
+

DICOM Query

+
+
+
+
+ +
+
+
+
+
+ +
+
+
+
+
+
+
+ +
+
+
+
+
+ +
+
+
+
+
+ +
+
+ +
+
+
+
+ +
+
+
+
+
+ +
+
+ +
+ + + + + + + + + + + + + +
idstatusenqueued_ataccessionresultprogress
+
+
+ +
+ +{% endblock %} \ No newline at end of file diff --git a/webinterface/users.py b/webinterface/users.py index 1d70f57f..f7b7276b 100755 --- a/webinterface/users.py +++ b/webinterface/users.py @@ -187,8 +187,7 @@ async def show_users(request) -> Response: return PlainTextResponse("Configuration is being updated. Try again in a minute.") template = "users.html" - context = {"request": request, "mercure_version": mercure_defs.VERSION, "page": "users", "users": users_list} - context.update(get_user_information(request)) + context = {"request": request, "page": "users", "users": users_list} return templates.TemplateResponse(template, context) @@ -237,12 +236,10 @@ async def users_edit(request) -> Response: template = "users_edit.html" context = { "request": request, - "mercure_version": mercure_defs.VERSION, "page": "users", "edituser": edituser, "edituser_info": users_list[edituser], } - context.update(get_user_information(request)) return templates.TemplateResponse(template, context) From 6a6eabad23e1e7a27c8c767c31a9224d351c8ba4 Mon Sep 17 00:00:00 2001 From: Roy Wiggins Date: Fri, 28 Jun 2024 17:57:21 +0000 Subject: [PATCH 13/42] beginner support for batch process --- requirements.in | 10 +- requirements.txt | 18 +-- webinterface/common.py | 7 +- webinterface/dashboards/query.py | 146 ++++++++++++++++-- webinterface/templates/dashboards/query.html | 36 ++++- .../dashboards/query_job_fragment.html | 29 ++++ 6 files changed, 216 insertions(+), 30 deletions(-) create mode 100644 webinterface/templates/dashboards/query_job_fragment.html diff --git a/requirements.in b/requirements.in index c01e860c..62c8df45 100644 --- a/requirements.in +++ b/requirements.in @@ -57,8 +57,10 @@ pillow >= 10.0.1 dicomweb-client boto3 freezegun -certifi>=2023.07.22 -future>=0.18.3 -lxml>=4.9.1 +certifi >= 2023.07.22 +future >= 0.18.3 +lxml >= 4.9.1 pyxnat -urllib3>=1.26.18 \ No newline at end of file +urllib3 >= 1.26.18 +rq ~= 1.16.2 +rq-scheduler ~= 0.13.1 \ No newline at end of file diff --git a/requirements.txt b/requirements.txt index 041369e5..a2f6d411 100644 --- a/requirements.txt +++ b/requirements.txt @@ -2,7 +2,7 @@ # This file is autogenerated by pip-compile with Python 3.10 # by the following command: # -# pip-compile requirements.in +# pip-compile # aiofiles==23.2.1 # via -r requirements.in @@ -25,6 +25,7 @@ async-timeout==4.0.3 # aiohttp # aiopg # asyncpg + # redis asyncpg==0.29.0 # via -r requirements.in attrs==23.2.0 @@ -45,7 +46,9 @@ certifi==2024.6.2 charset-normalizer==3.3.2 # via requests click==8.1.7 - # via uvicorn + # via + # rq + # uvicorn daiquiri==3.2.5.1 # via -r requirements.in databases[aiopg]==0.8.0 @@ -176,16 +179,13 @@ pyxnat==1.6.2 reactivex==4.0.4 # via influxdb-client requests==2.32.3 - # via - # dicomweb-client - # docker - # python-nomad - # pyxnat - # sphinx +redis==5.0.4 + # via rq retrying==1.3.4 # via dicomweb-client s3transfer==0.10.1 - # via boto3 +rq==1.16.2 + # via -r requirements.in six==1.16.0 # via # python-dateutil diff --git a/webinterface/common.py b/webinterface/common.py index 60e65adb..25a35efd 100755 --- a/webinterface/common.py +++ b/webinterface/common.py @@ -14,10 +14,11 @@ from starlette.templating import Jinja2Templates from common.constants import mercure_defs +from rq_scheduler import Scheduler - - -worker_queue = Queue(connection=Redis()) +redis = Redis() +worker_queue = Queue(connection=redis) +worker_scheduler = Scheduler(queue=worker_queue, connection=worker_queue.connection) def get_user_information(request) -> dict: """Returns dictionary of values 
that should always be passed to the templates when the user is logged in.""" diff --git a/webinterface/dashboards/query.py b/webinterface/dashboards/query.py index e27f0740..8dd692de 100644 --- a/webinterface/dashboards/query.py +++ b/webinterface/dashboards/query.py @@ -2,7 +2,7 @@ from webinterface.query import SimpleDicomClient # Standard python includes from datetime import datetime - +import time, random # Starlette-related includes from starlette.authentication import requires @@ -11,34 +11,139 @@ from webinterface.common import templates import common.config as config from starlette.responses import PlainTextResponse, JSONResponse -from webinterface.common import worker_queue +from webinterface.common import worker_queue, redis +from rq import Connection from rq import get_current_job - +from rq.job import Job from .common import router logger = config.get_logger() -def test_job(*,accession, node): +def query_job(*,accession, node): config.read_config() c = SimpleDicomClient(node.ip, node.port, node.aet_target, config.mercure.incoming_folder) + job = get_current_job() + job.meta["started"] = 1 + job.save_meta() for identifier in c.getscu(accession): - job = get_current_job() job.meta['failed'] = identifier.NumberOfFailedSuboperations job.meta['remaining'] = identifier.NumberOfRemainingSuboperations job.meta['completed'] = identifier.NumberOfCompletedSuboperations + if not job.meta.get('total', False): + job.meta['total'] = identifier.NumberOfCompletedSuboperations + identifier.NumberOfRemainingSuboperations + job.meta["started"] += 1 job.save_meta() return "Complete" +def dummy_job(*,accession, node): + total_time = 3 # Total time for the job in seconds (1 minute) + update_interval = 1 # Interval between updates in seconds + + start_time = time.monotonic() + job = get_current_job() + if job.meta.get('parent'): + job_parent = worker_queue.fetch_job(job.meta['parent']) + else: + job_parent = None + # failed = 0 + remaining = total_time // update_interval + completed = 0 + print(accession) + if job_parent: + job_parent.meta['started'] = job_parent.meta.get('started',0) + 1 + job_parent.save_meta() + + job.meta['started'] = 1 + job.meta['total'] = remaining + job.meta['progress'] = f"0 / {job.meta['total']}" + job.save_meta() + while (time.monotonic() - start_time) < total_time: + time.sleep(update_interval) # Sleep for the interval duration + remaining -= 1 + completed += 1 + + # job.meta['failed'] = failed + job.meta['remaining'] = remaining + job.meta['completed'] = completed + job.meta['progress'] = f"{completed} / {job.meta['total']}" + print(job.meta['progress']) + job.save_meta() # Save the updated meta data to the job + + if job_parent: + job_parent.meta['completed'] += 1 + job_parent.meta['progress'] = f"{job_parent.meta['completed'] } / {job_parent.meta['total']}" + + job_parent.save_meta() + return "Job complete" + +def batch_job(*, accessions, subjobs): + print(subjobs) + return "Batch complete" + +def monitor_job(): + print("monitoring") + +@router.get("/query/job_info") +@requires(["authenticated", "admin"], redirect="login") +async def get_job_info(request): + job_id = request.query_params['id'] + job = worker_queue.fetch_job(job_id) + if not job: + return JSONResponse({'error': 'Job not found'}, status_code=404) + + subjob_info = [] + for job_id in job.kwargs.get('subjobs',[]): + subjob = worker_queue.fetch_job(job_id) + if subjob: + subjob_info.append({'id': subjob.get_id(), + 'ended_at': subjob.ended_at.isoformat().split('.')[0] if subjob.ended_at else "", + 
'created_at_dt':subjob.created_at, + 'accession': subjob.kwargs['accession'], + 'progress': subjob.meta.get('progress'), + 'status': subjob.get_status()}) + subjob_info = sorted(subjob_info, key=lambda x:x['created_at_dt']) + return templates.TemplateResponse("dashboards/query_job_fragment.html", {"request":request,"subjob_info":subjob_info}) + @router.post("/query") @requires(["authenticated", "admin"], redirect="login") -async def query_post(request): +async def query_post_batch(request): + """ + Starts a new query job for the given accession number and DICOM node. + """ form = await request.form() + for n in config.mercure.dicom_retrieve.dicom_nodes: + if n.name == form.get("dicom_node"): + node = n + break + random_accessions = ["".join(random.choices([str(i) for i in range(10)], k=10)) for _ in range(5)] + jobs = [] + with Connection(redis): + for accession in random_accessions: + job = Job.create(dummy_job, kwargs=dict(accession=accession, node=node), timeout='30m', result_ttl=-1, meta=dict(type="get_accession_batch",parent=None)) + jobs.append(job) + full_job = Job.create(batch_job, kwargs=dict(accessions=random_accessions, subjobs=[j.id for j in jobs]), timeout=-1, result_ttl=-1, meta=dict(type="batch", started=0, completed=0, total=len(jobs)), depends_on=[j.id for j in jobs]) + for j in jobs: + j.meta["parent"] = full_job.id + + for j in jobs: + worker_queue.enqueue_job(j) + worker_queue.enqueue_job(full_job) + # worker_scheduler.schedule(scheduled_time=datetime.utcnow(), func=monitor_job, interval=10, repeat=10, result_ttl=-1) + return PlainTextResponse() + +@router.post("/query_single") +@requires(["authenticated", "admin"], redirect="login") +async def query_post(request): + """ + Starts a new query job for the given accession number and DICOM node. 
+ """ + form = await request.form() for n in config.mercure.dicom_retrieve.dicom_nodes: if n.name == form.get("dicom_node"): node = n break - worker_queue.enqueue_call(test_job, kwargs=dict(accession=form.get("accession"), node=node), timeout='10m', result_ttl=-1) + worker_queue.enqueue_call(query_job, kwargs=dict(accession=form.get("accession"), node=node), timeout='30m', result_ttl=-1, meta=dict(type="get_accession_single")) return PlainTextResponse() @router.get("/query/jobs") @@ -55,12 +160,33 @@ async def query_jobs(request): for r in registries: for j_id in r.get_job_ids(): job = worker_queue.fetch_job(j_id) - job_info.append(dict(id=j_id, + if job.meta.get('type') != 'batch': + continue + job_dict = dict(id=j_id, status=job.get_status(), parameters=dict(accession=job.kwargs.get('accession','')), - enqueued_at=1000*datetime.timestamp(job.enqueued_at), + created_at=1000*datetime.timestamp(job.created_at) if job.created_at else "", + enqueued_at=1000*datetime.timestamp(job.enqueued_at) if job.enqueued_at else "", result=job.result, - meta=job.meta)) + meta=job.meta, + progress="") + # if job.meta.get('completed') and job.meta.get('remaining'): + # job_dict["progress"] = f"{job.meta.get('completed')} / {job.meta.get('completed') + job.meta.get('remaining')}" + # if job.meta.get('type',None) == "batch": + n_started = job.meta.get('started',0) + n_completed = job.meta.get('completed',0) + n_total = job.meta.get('total',0) + + if job_dict["status"] == "finished": + job_dict["progress"] = f"{n_total} / {n_total}" + elif job_dict["status"] in ("deferred","started"): + job_dict["progress"] = f"{n_completed} / {n_total}" + if 0 < n_started < n_total: + job_dict["status"] = "running" + elif n_completed == n_total: + job_dict["status"] = "finishing" + + job_info.append(job_dict) return JSONResponse(dict(data=job_info)) # return PlainTextResponse(",".join([str(j) for j in all_jobs])) diff --git a/webinterface/templates/dashboards/query.html b/webinterface/templates/dashboards/query.html index 48756c04..f595df46 100644 --- a/webinterface/templates/dashboards/query.html +++ b/webinterface/templates/dashboards/query.html @@ -68,9 +68,11 @@

DICOM Query

                        <tr>
+                            <th></th>
                             <th>id</th>
+                            <th>type</th>
                             <th>status</th>
-                            <th>enqueued_at</th>
+                            <th>created_at</th>
                             <th>accession</th>
                             <th>result</th>
                             <th>progress</th>
                         </tr>
@@ -93,14 +95,22 @@

DICOM Query

                ajax: "query/jobs",
                 deferRender: true,
                 columns: [
+                    {
+                        className: 'dt-control',
+                        orderable: false,
+                        data: null,
+                        defaultContent: ''
+                    },
                     { data: 'id' },
+                    { data: 'meta', render: data => data["type"]? data["type"]:"" },
                     { data: 'status' },
-                    { data: 'enqueued_at', render: data => `${data}`+new Date(data).toLocaleString("en-US")},
+                    { data: 'created_at', render: data => `${data || Date.now() }`+(data? new Date(data).toLocaleString("en-US"):"")},
                     { data: 'parameters', render: data => data["accession"] || ""},
                     { data: 'result' },
-                    { data: 'meta', render: data => data["completed"]?`${data["completed"]}/${data["remaining"]+data["completed"]}`:"" },
+                    { data: 'progress'},
                 ],
                 select: {
+                    selector:'td:not(:first-child)',
                     style: 'os'
                 },
                 language: {
@@ -108,10 +118,28 @@

DICOM Query

                },
                 // filter: true,
                 buttons: [],
-                order: [[2, 'desc']],
+                order: [[4, 'desc']],
                 initComplete: function() {
                 }
             });
+            window.datatable.on('click', 'td.dt-control', function (e) {
+                let tr = e.target.closest('tr');
+                let row = window.datatable.row(tr);
+
+                if (row.child.isShown()) {
+                    // This row is already open - close it
+                    row.child.hide();
+                }
+                else {
+                    // Open this row
+                    fetch("query/job_info?id="+row.data().id, {method: "GET"}
+                    ).then(
+                        response => response.text()
+                    ).then(data=>{
+                        row.child(data).show();
+                    });
+                }
+            });
         });
 {% endblock %}
\ No newline at end of file
diff --git a/webinterface/templates/dashboards/query_job_fragment.html b/webinterface/templates/dashboards/query_job_fragment.html
new file mode 100644
index 00000000..36314c81
--- /dev/null
+++ b/webinterface/templates/dashboards/query_job_fragment.html
@@ -0,0 +1,29 @@
+<table class="table is-fullwidth">
+    <thead>
+        <tr>
+            <th>
+                Accession
+            </th>
+            <th>
+                Ended at
+            </th>
+            <th>
+                Status
+            </th>
+            <th>
+                Progress
+            </th>
+        </tr>
+    </thead>
+    <tbody>
+        {% for job in subjob_info %}
+        <tr>
+            <td>{{job['accession']}}</td>
+            <td>{{job['ended_at'] or ''}}</td>
+            <td>{{job['status']}}</td>
+            <td>{{job['progress'] or ''}}</td>
+        </tr>
+        {% endfor %}
+    </tbody>
+</table>
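The batching introduced in this commit hangs together as follows: each accession becomes its own rq job, a parent job depends on all of them, and the subjobs report progress back into the parent's meta. A condensed, self-contained sketch of that pattern, assuming a local Redis on the default port; the helper names (fetch_accession, collect_results, enqueue_batch) are illustrative and not part of the patch:

    from redis import Redis
    from rq import Queue, get_current_job
    from rq.job import Job

    redis = Redis()               # assumption: Redis reachable on localhost:6379
    queue = Queue(connection=redis)

    def fetch_accession(*, accession):
        """Stand-in for the per-accession job; runs inside the rq worker."""
        job = get_current_job()
        parent_id = job.meta.get("parent")
        # ... perform the actual C-GET for `accession` here ...
        if parent_id:
            parent = Job.fetch(parent_id, connection=redis)
            parent.get_meta()                      # refresh before touching shared counters
            parent.meta["completed"] = parent.meta.get("completed", 0) + 1
            parent.save_meta()
        return "ok"

    def collect_results(*, accessions, subjobs):
        """Stand-in for the batch job that runs once every subjob has finished."""
        return f"collected {len(accessions)} accessions"

    def enqueue_batch(accessions):
        subjobs = [queue.enqueue(fetch_accession, kwargs=dict(accession=a),
                                 result_ttl=-1, meta=dict(parent=None))
                   for a in accessions]
        parent = queue.enqueue(collect_results,
                               kwargs=dict(accessions=accessions,
                                           subjobs=[j.id for j in subjobs]),
                               result_ttl=-1,
                               depends_on=subjobs,   # deferred until all subjobs succeed
                               meta=dict(type="batch", completed=0, total=len(subjobs)))
        for j in subjobs:                            # let each subjob find its parent
            j.meta["parent"] = parent.id
            j.save_meta()
        return parent

The patch itself builds the Job objects first (Job.create) and only enqueues them after the parent id has been written into each subjob's meta, so no subjob can start before it knows where to report progress.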
\ No newline at end of file From 48205eb862a925e08389a55651ecd78294423556 Mon Sep 17 00:00:00 2001 From: Roy Wiggins Date: Fri, 28 Jun 2024 17:57:21 +0000 Subject: [PATCH 14/42] create dummy files --- webinterface/dashboards/query.py | 15 ++++++++++++--- 1 file changed, 12 insertions(+), 3 deletions(-) diff --git a/webinterface/dashboards/query.py b/webinterface/dashboards/query.py index 8dd692de..81170039 100644 --- a/webinterface/dashboards/query.py +++ b/webinterface/dashboards/query.py @@ -1,4 +1,6 @@ +from pathlib import Path +import shutil from webinterface.query import SimpleDicomClient # Standard python includes from datetime import datetime @@ -34,7 +36,8 @@ def query_job(*,accession, node): job.save_meta() return "Complete" -def dummy_job(*,accession, node): +def dummy_job(*,accession, node, path): + Path(path).mkdir(parents=True, exist_ok=True) total_time = 3 # Total time for the job in seconds (1 minute) update_interval = 1 # Interval between updates in seconds @@ -58,6 +61,7 @@ def dummy_job(*,accession, node): job.save_meta() while (time.monotonic() - start_time) < total_time: time.sleep(update_interval) # Sleep for the interval duration + (Path(path) / f"dummy{completed}_{job.id}.dcm").touch() remaining -= 1 completed += 1 @@ -75,8 +79,10 @@ def dummy_job(*,accession, node): job_parent.save_meta() return "Job complete" -def batch_job(*, accessions, subjobs): - print(subjobs) +def batch_job(*, accessions, subjobs, path): + for p in Path(path).glob("**/*.dcm"): + shutil.move(p, "/opt/mercure/data/incoming") + shutil.rmtree(path) return "Batch complete" def monitor_job(): @@ -123,6 +129,9 @@ async def query_post_batch(request): full_job = Job.create(batch_job, kwargs=dict(accessions=random_accessions, subjobs=[j.id for j in jobs]), timeout=-1, result_ttl=-1, meta=dict(type="batch", started=0, completed=0, total=len(jobs)), depends_on=[j.id for j in jobs]) for j in jobs: j.meta["parent"] = full_job.id + j.kwargs["path"] = f"/opt/mercure/data/query/job_dirs/{full_job.id}/{j.kwargs['accession']}" + full_job.kwargs["path"] = Path(f"/opt/mercure/data/query/job_dirs/{full_job.id}") + for j in jobs: worker_queue.enqueue_job(j) From e12ac9c6c3e8d0ce7e49ea79f8e87ded4d8e4748 Mon Sep 17 00:00:00 2001 From: Roy Wiggins Date: Fri, 28 Jun 2024 17:57:21 +0000 Subject: [PATCH 15/42] - pause/resume jobs - redirect results to folder --- common/types.py | 7 +- webinterface/common.py | 3 + webinterface/dashboards/query.py | 200 ++++++++++++++----- webinterface/templates/dashboards/query.html | 95 ++++++++- 4 files changed, 248 insertions(+), 57 deletions(-) diff --git a/common/types.py b/common/types.py index 9558db6c..aaba7738 100755 --- a/common/types.py +++ b/common/types.py @@ -185,9 +185,14 @@ class DicomNode(BaseModel): aet_target: str aet_source: Optional[str] = "" +class DicomDestination(BaseModel): + name: str + path: str + class DicomRetrieveConfig(BaseModel): dicom_nodes: List[DicomNode] = [] - + destination_folders: List[DicomDestination] = [] + class Config(BaseModel, Compat): appliance_name: str port: int diff --git a/webinterface/common.py b/webinterface/common.py index 25a35efd..d0692a89 100755 --- a/webinterface/common.py +++ b/webinterface/common.py @@ -17,6 +17,9 @@ from rq_scheduler import Scheduler redis = Redis() + + + worker_queue = Queue(connection=redis) worker_scheduler = Scheduler(queue=worker_queue, connection=worker_queue.connection) diff --git a/webinterface/dashboards/query.py b/webinterface/dashboards/query.py index 81170039..eca892da 100644 --- 
a/webinterface/dashboards/query.py +++ b/webinterface/dashboards/query.py @@ -20,6 +20,8 @@ from .common import router logger = config.get_logger() + + def query_job(*,accession, node): config.read_config() c = SimpleDicomClient(node.ip, node.port, node.aet_target, config.mercure.incoming_folder) @@ -36,9 +38,10 @@ def query_job(*,accession, node): job.save_meta() return "Complete" + def dummy_job(*,accession, node, path): Path(path).mkdir(parents=True, exist_ok=True) - total_time = 3 # Total time for the job in seconds (1 minute) + total_time = 10 # Total time for the job in seconds (1 minute) update_interval = 1 # Interval between updates in seconds start_time = time.monotonic() @@ -61,7 +64,10 @@ def dummy_job(*,accession, node, path): job.save_meta() while (time.monotonic() - start_time) < total_time: time.sleep(update_interval) # Sleep for the interval duration - (Path(path) / f"dummy{completed}_{job.id}.dcm").touch() + out_file = (Path(path) / f"dummy{completed}_{job.id}.dcm") + if out_file.exists(): + raise Exception(f"{out_file} exists already") + out_file.touch() remaining -= 1 completed += 1 @@ -73,21 +79,82 @@ def dummy_job(*,accession, node, path): job.save_meta() # Save the updated meta data to the job if job_parent: + job_parent.get_meta() # there is technically a race condition here... job_parent.meta['completed'] += 1 - job_parent.meta['progress'] = f"{job_parent.meta['completed'] } / {job_parent.meta['total']}" + job_parent.meta['progress'] = f"{job_parent.meta['started'] } / {job_parent.meta['completed'] } / {job_parent.meta['total']}" job_parent.save_meta() return "Job complete" -def batch_job(*, accessions, subjobs, path): - for p in Path(path).glob("**/*.dcm"): - shutil.move(p, "/opt/mercure/data/incoming") +def batch_job(*, accessions, subjobs, path, destination): + job = get_current_job() + job.save_meta() + logger.info(f"Job completing {job.id}") + logger.info(path) + if destination is None: + for p in Path(path).glob("**/*"): + if p.is_file(): + shutil.move(p, config.mercure.incoming_folder) + else: + dest_folder: Path = Path(destination) / job.id + dest_folder.mkdir() + for p in Path(path).iterdir(): + if p.is_dir(): + logger.info(f"moving {p} to {dest_folder}") + shutil.move(p, dest_folder) + shutil.rmtree(path) - return "Batch complete" + return "Job complete" + + def monitor_job(): print("monitoring") +@router.post("/query/pause_job") +@requires(["authenticated", "admin"], redirect="login") +async def pause_job(request): + job = worker_queue.fetch_job(request.query_params['id']) + if not job: + return JSONResponse({'error': 'Job not found'}, status_code=404) + if job.is_finished or job.is_failed: + return JSONResponse({'error': 'Job is already finished'}, status_code=400) + + for job_id in job.kwargs.get('subjobs',[]): + subjob = worker_queue.fetch_job(job_id) + if subjob and (subjob.is_deferred or subjob.is_queued): + subjob.meta['paused'] = True + subjob.save_meta() + subjob.cancel() + job.meta['paused'] = True + job.save_meta() + return JSONResponse({'status': 'success'}, status_code=200) + +@router.post("/query/resume_job") +@requires(["authenticated", "admin"], redirect="login") +async def resume_job(request): + job = worker_queue.fetch_job(request.query_params['id']) + if not job: + return JSONResponse({'error': 'Job not found'}, status_code=404) + if job.is_finished or job.is_failed: + return JSONResponse({'error': 'Job is already finished'}, status_code=400) + # if not job.meta.get('paused', False): + # return JSONResponse({'error': 'Job is not 
paused'}, status_code=400) + + for subjob_id in job.kwargs.get('subjobs',[]): + subjob = worker_queue.fetch_job(subjob_id) + if subjob and subjob.meta.get('paused', None): + subjob.meta['paused'] = False + subjob.save_meta() + worker_queue.canceled_job_registry.requeue(subjob_id) + # worker_queue.canceled_job_registry.remove(subjob_id) + job.get_meta() + job.meta['paused'] = False + job.save_meta() + # worker_queue.canceled_job_registry.requeue(job.id) + # worker_queue.canceled_job_registry.remove(job.id) + return JSONResponse({'status': 'success'}, status_code=200) + @router.get("/query/job_info") @requires(["authenticated", "admin"], redirect="login") async def get_job_info(request): @@ -97,17 +164,21 @@ async def get_job_info(request): return JSONResponse({'error': 'Job not found'}, status_code=404) subjob_info = [] - for job_id in job.kwargs.get('subjobs',[]): - subjob = worker_queue.fetch_job(job_id) - if subjob: - subjob_info.append({'id': subjob.get_id(), - 'ended_at': subjob.ended_at.isoformat().split('.')[0] if subjob.ended_at else "", - 'created_at_dt':subjob.created_at, - 'accession': subjob.kwargs['accession'], - 'progress': subjob.meta.get('progress'), - 'status': subjob.get_status()}) + subjobs = (worker_queue.fetch_job(job) for job in job.kwargs.get('subjobs', [])) + for subjob in subjobs: + info = {'id': subjob.get_id(), + 'ended_at': subjob.ended_at.isoformat().split('.')[0] if subjob.ended_at else "", + 'created_at_dt':subjob.created_at, + 'accession': subjob.kwargs['accession'], + 'progress': subjob.meta.get('progress'), + 'paused': subjob.meta.get('paused',False), + 'status': subjob.get_status() + } + if info['status'] == 'canceled' and info['paused']: + info['status'] = 'paused' + subjob_info.append(info) subjob_info = sorted(subjob_info, key=lambda x:x['created_at_dt']) - return templates.TemplateResponse("dashboards/query_job_fragment.html", {"request":request,"subjob_info":subjob_info}) + return templates.TemplateResponse("dashboards/query_job_fragment.html", {"request":request,"job":job,"subjob_info":subjob_info}) @router.post("/query") @requires(["authenticated", "admin"], redirect="login") @@ -120,18 +191,22 @@ async def query_post_batch(request): if n.name == form.get("dicom_node"): node = n break - random_accessions = ["".join(random.choices([str(i) for i in range(10)], k=10)) for _ in range(5)] + destination = form.get("destination") + for d in config.mercure.dicom_retrieve.destination_folders: + if d.name == destination: + destination_path = d.path + random_accessions = ["".join(random.choices([str(i) for i in range(10)], k=5)) for _ in range(3)] jobs = [] with Connection(redis): for accession in random_accessions: - job = Job.create(dummy_job, kwargs=dict(accession=accession, node=node), timeout='30m', result_ttl=-1, meta=dict(type="get_accession_batch",parent=None)) + job = Job.create(dummy_job, kwargs=dict(accession=accession, node=node), timeout='30m', result_ttl=-1, meta=dict(type="get_accession_batch",parent=None, paused=False)) jobs.append(job) - full_job = Job.create(batch_job, kwargs=dict(accessions=random_accessions, subjobs=[j.id for j in jobs]), timeout=-1, result_ttl=-1, meta=dict(type="batch", started=0, completed=0, total=len(jobs)), depends_on=[j.id for j in jobs]) + full_job = Job.create(batch_job, kwargs=dict(accessions=random_accessions, subjobs=[j.id for j in jobs], destination=destination_path), timeout=-1, result_ttl=-1, meta=dict(type="batch", started=0, paused=False,completed=0, total=len(jobs)), depends_on=[j.id for j in jobs]) for j 
in jobs: j.meta["parent"] = full_job.id j.kwargs["path"] = f"/opt/mercure/data/query/job_dirs/{full_job.id}/{j.kwargs['accession']}" full_job.kwargs["path"] = Path(f"/opt/mercure/data/query/job_dirs/{full_job.id}") - + full_job.kwargs["path"].mkdir(parents=True) for j in jobs: worker_queue.enqueue_job(j) @@ -164,38 +239,59 @@ async def query_jobs(request): worker_queue.finished_job_registry, # Returns FinishedJobRegistry worker_queue.failed_job_registry, # Returns FailedJobRegistry worker_queue.scheduled_job_registry, # Returns ScheduledJobRegistry + worker_queue.canceled_job_registry, # Returns CanceledJobRegistry ] job_info = [] - for r in registries: - for j_id in r.get_job_ids(): - job = worker_queue.fetch_job(j_id) - if job.meta.get('type') != 'batch': - continue - job_dict = dict(id=j_id, - status=job.get_status(), - parameters=dict(accession=job.kwargs.get('accession','')), - created_at=1000*datetime.timestamp(job.created_at) if job.created_at else "", - enqueued_at=1000*datetime.timestamp(job.enqueued_at) if job.enqueued_at else "", - result=job.result, - meta=job.meta, - progress="") - # if job.meta.get('completed') and job.meta.get('remaining'): - # job_dict["progress"] = f"{job.meta.get('completed')} / {job.meta.get('completed') + job.meta.get('remaining')}" - # if job.meta.get('type',None) == "batch": - n_started = job.meta.get('started',0) - n_completed = job.meta.get('completed',0) - n_total = job.meta.get('total',0) - - if job_dict["status"] == "finished": - job_dict["progress"] = f"{n_total} / {n_total}" - elif job_dict["status"] in ("deferred","started"): - job_dict["progress"] = f"{n_completed} / {n_total}" - if 0 < n_started < n_total: - job_dict["status"] = "running" - elif n_completed == n_total: - job_dict["status"] = "finishing" - - job_info.append(job_dict) + # logger.info(worker_queue.job_ids) + # for registry in registries: + job_ids = set() + for registry in registries: + for j_id in registry.get_job_ids(): + job_ids.add(j_id) + for j_id in worker_queue.job_ids: + job_ids.add(j_id) + + for j_id in job_ids: + job = worker_queue.fetch_job(j_id) + job_meta = job.get_meta() + if job_meta.get('type') != 'batch': + continue + job_dict = dict(id=j_id, + status=job.get_status(), + parameters=dict(accession=job.kwargs.get('accession','')), + created_at=1000*datetime.timestamp(job.created_at) if job.created_at else "", + enqueued_at=1000*datetime.timestamp(job.enqueued_at) if job.enqueued_at else "", + result=job.result, + meta=job_meta, + progress="") + # if job.meta.get('completed') and job.meta.get('remaining'): + # job_dict["progress"] = f"{job.meta.get('completed')} / {job.meta.get('completed') + job.meta.get('remaining')}" + # if job.meta.get('type',None) == "batch": + n_started = job_meta.get('started',0) + n_completed = job_meta.get('completed',0) + n_total = job_meta.get('total',0) + + if job_dict["status"] == "finished": + job_dict["progress"] = f"{n_total} / {n_total}" + elif job_dict["status"] in ("deferred","started", "paused", "canceled"): + job_dict["progress"] = f"{n_completed} / {n_total}" + + # if job_dict["status"] == "canceled" and + if job_dict["meta"].get('paused', False): + if n_started < n_completed: # TODO: this does not work + job_dict["status"] = "pausing" + else: + job_dict["status"] = "paused" + + if job_dict["status"] in ("deferred", "started"): + if n_started == 0: + job_dict["status"] = "waiting" + elif n_completed < n_total: + job_dict["status"] = "running" + elif n_completed == n_total: + job_dict["status"] = "finishing" + + 
job_info.append(job_dict) return JSONResponse(dict(data=job_info)) # return PlainTextResponse(",".join([str(j) for j in all_jobs])) @@ -205,7 +301,7 @@ async def query(request): template = "dashboards/query.html" context = { "request": request, - + "destination_folders": config.mercure.dicom_retrieve.destination_folders, "dicom_nodes": config.mercure.dicom_retrieve.dicom_nodes, "page": "query", } diff --git a/webinterface/templates/dashboards/query.html b/webinterface/templates/dashboards/query.html index f595df46..085cc209 100644 --- a/webinterface/templates/dashboards/query.html +++ b/webinterface/templates/dashboards/query.html @@ -44,7 +44,26 @@

DICOM Query


DICOM Query

-
@@ -84,12 +102,45 @@

DICOM Query

+
+
+
 {% endblock %}
 {% block dashboard_content %}
@@ -16,7 +17,7 @@

DICOM Query

 Redis connection not available, so this dashboard will not function.
 {% endif %}
-
+
@@ -89,7 +90,7 @@

DICOM Query
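The pause/resume handlers added in this commit boil down to: pausing cancels every subjob that has not started yet (which parks it in the CanceledJobRegistry) and marks it as paused, and resuming requeues exactly those subjobs. A minimal sketch of that round trip, assuming an rq version whose registries expose requeue() as the handlers rely on; the function names are illustrative and not part of the patch:

    from redis import Redis
    from rq import Queue
    from rq.job import Job

    redis = Redis()
    queue = Queue(connection=redis)

    def pause_batch(parent_id: str) -> None:
        parent = Job.fetch(parent_id, connection=redis)
        for sub_id in parent.kwargs.get("subjobs", []):
            sub = Job.fetch(sub_id, connection=redis)
            if sub.is_deferred or sub.is_queued:          # only jobs that have not started
                sub.meta["paused"] = True
                sub.save_meta()
                sub.cancel()                              # lands in the CanceledJobRegistry
        parent.meta["paused"] = True
        parent.save_meta()

    def resume_batch(parent_id: str) -> None:
        parent = Job.fetch(parent_id, connection=redis)
        for sub_id in parent.kwargs.get("subjobs", []):
            sub = Job.fetch(sub_id, connection=redis)
            if sub.meta.get("paused"):
                sub.meta["paused"] = False
                sub.save_meta()
                queue.canceled_job_registry.requeue(sub_id)   # put it back on the queue
        parent.meta["paused"] = False
        parent.save_meta()

Running subjobs are left to finish; only queued or deferred ones are parked, which is why the jobs table distinguishes the "pausing" and "paused" states.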