-
Notifications
You must be signed in to change notification settings - Fork 9
/
Copy pathacapy_events_processor.py
431 lines (360 loc) · 17.1 KB
/
acapy_events_processor.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
import asyncio
import datetime
import sys
from typing import Any, Dict, List, NoReturn
from uuid import uuid4
import orjson
from shared import APIRouter
from shared.constants import GOVERNANCE_LABEL
from shared.log_config import get_logger
from shared.models.endorsement import (
obfuscate_primary_data_in_payload,
payload_is_applicable_for_endorser,
)
from shared.util.rich_parsing import parse_json_with_error_handling
from webhooks.models import AcaPyWebhookEvent, topic_mapping
from webhooks.models.conversions import acapy_to_cloudapi_event
from webhooks.models.redis_payloads import AcaPyRedisEvent
from webhooks.services.billing_manager import is_applicable_for_billing
from webhooks.services.webhooks_redis_service import WebhooksRedisService
# Module-level logger, named after this module; used by AcaPyEventsProcessor below.
logger = get_logger(__name__)
# NOTE(review): `router` is not referenced anywhere else in the visible code —
# presumably it is picked up by another module; confirm before removing.
router = APIRouter()
class AcaPyEventsProcessor:
    """
    Class to process ACA-Py webhook events that the plugin writes to redis.

    A background asyncio task repeatedly scans redis for list keys matching the
    ACA-Py prefix. For each key it tries to take a lock, processes every event in
    the list (converting it to the CloudAPI format and forwarding it to the
    endorser / billing / webhook destinations), and then releases the lock.
    """

    def __init__(self, redis_service: WebhooksRedisService) -> None:
        """
        Args:
            redis_service: The redis service used for scanning, locking, reading
                and writing events.
        """
        self.redis_service = redis_service

        # Redis prefix for acapy events:
        self.acapy_redis_prefix = self.redis_service.acapy_redis_prefix

        # Event for indicating redis keyspace notifications
        self._new_event_notification = asyncio.Event()
        self._pubsub = None  # for managing redis pubsub connection
        self._pubsub_thread = None

        self._tasks: List[asyncio.Task] = []  # To keep track of running tasks

    def start(self) -> None:
        """
        Start the background tasks as part of AcaPyEventsProcessor's lifecycle

        Uses `asyncio.create_task`, so it must be called while an event loop is running.
        """
        # self._start_notification_listener()  # disable as it is currently unused
        self._tasks.append(
            asyncio.create_task(
                self._process_incoming_events(), name="Process incoming events"
            )
        )
        logger.info("AcaPyEventsProcessor started.")

    async def stop(self) -> None:
        """
        Stops all background tasks gracefully.

        Every tracked task is cancelled and awaited, then the pubsub thread and
        connection (if they were ever started) are shut down.
        """
        for task in self._tasks:
            task.cancel()  # Request cancellation of the task
            try:
                await task  # Wait for the task to be cancelled
            except asyncio.CancelledError:
                pass  # Expected error upon cancellation, can be ignored
            except Exception as e:  # pylint: disable=W0718
                # A task that already died (e.g. too many consecutive exceptions)
                # re-raises its stored exception when awaited. That must not abort
                # the shutdown of the remaining tasks and the pubsub connection.
                logger.warning(
                    "Task `{}` had already failed before shutdown: {}",
                    task.get_name(),
                    e,
                )
        self._tasks.clear()  # Clear the list of tasks

        if self._pubsub_thread:
            self._pubsub_thread.stop()
            logger.info("Stopped AcaPyEvents pubsub thread")

        if self._pubsub:
            await asyncio.sleep(0.1)  # allow thread to stop before disconnecting
            self._pubsub.disconnect()
            logger.info("Disconnected AcaPyEvents pubsub instance")

        logger.info("AcaPyEventsProcessor stopped.")

    def are_tasks_running(self) -> bool:
        """
        Checks if the background tasks are still running.

        Returns:
            True if all background tasks are running, False if any task has stopped
            or if no task has been started.
        """
        logger.debug("Checking if all tasks are running")

        # todo: disabling pubsub thread check as it's currently unused and disconnects periodically on test env
        pubsub_thread_running = (
            True  # self._pubsub_thread and self._pubsub_thread.is_alive()
        )
        # `bool(...)` so that an empty task list yields False rather than `[]`
        tasks_running = bool(self._tasks) and all(
            not task.done() for task in self._tasks
        )

        if not pubsub_thread_running:
            logger.error("Pubsub thread is not running")

        if not tasks_running:
            for task in self._tasks:
                if task.done():
                    logger.error("Task `{}` is not running", task.get_name())

        all_running = tasks_running and pubsub_thread_running

        logger.debug("All tasks running: {}", all_running)
        return all_running

    def _rpush_notification_handler(self, msg) -> None:
        """
        Processing handler for when rpush notifications are received

        Args:
            msg: The pubsub message; only logged, its content is not inspected.
        """
        logger.trace("Received rpush notification: {}", msg)
        self._new_event_notification.set()

    def _start_notification_listener(self) -> None:
        """
        Listens for keyspace notifications from Redis and sets an event to resume processing.

        Currently not invoked: the call in `start` is commented out.
        """
        # Example subscription pattern for keyspace notifications. Adjust as necessary.
        self._pubsub = self.redis_service.redis.pubsub()

        # Subscribe this pubsub channel to the notification pattern (rpush represents ACA-Py writing to list types)
        notification_pattern = "__keyevent@0__:rpush"
        self._pubsub.psubscribe(
            **{notification_pattern: self._rpush_notification_handler}
        )
        self._pubsub_thread = self._pubsub.run_in_thread(sleep_time=0.01)

        logger.info("Notification listener subscribed to redis keyspace notifications")

    async def _process_incoming_events(self) -> NoReturn:
        """
        Processing handler for incoming ACA-Py redis webhooks events

        Loops forever: scans for list keys matching the ACA-Py prefix and attempts
        to process each one. When the scan is empty it sleeps briefly before retrying.

        Raises:
            Exception: re-raises the last error once `max_exception_count`
                consecutive iterations have failed, which ends the task.
        """
        logger.info("Starting ACA-Py Events Processor")

        exception_count = 0
        max_exception_count = 5  # break inf loop after 5 consecutive exceptions

        attempts_without_events = 0
        max_attempts_without_events = sys.maxsize  # use max int to never stop
        sleep_duration = 0.1

        while True:
            try:
                batch_event_keys = self.redis_service.scan_keys(
                    match_pattern=self.acapy_redis_prefix, count=10000
                )
                if batch_event_keys:
                    attempts_without_events = 0  # Reset the counter
                    for list_key in batch_event_keys:  # the keys are of LIST type
                        logger.debug("Attempt to process list key: {}", list_key)
                        self._attempt_process_list_events(list_key)

                    # Everything above is synchronous. Yield to the event loop so that,
                    # under sustained load, other tasks can run and this task remains
                    # cancellable.
                    await asyncio.sleep(0)
                else:
                    attempts_without_events += 1
                    if attempts_without_events >= max_attempts_without_events:
                        # Wait for a keyspace notification before continuing
                        logger.debug(
                            (
                                "Scan has returned no keys {} times in a row. "
                                "Waiting for keyspace notification..."
                            ),
                            max_attempts_without_events,
                        )
                        await self._new_event_notification.wait()
                        logger.debug("Keyspace notification triggered")
                        self._new_event_notification.clear()  # Reset the event for the next wait
                        attempts_without_events = 0  # Reset the counter
                    else:
                        await asyncio.sleep(sleep_duration)  # prevent a busy loop

                exception_count = 0  # reset exception count after successful loop
            except Exception:  # pylint: disable=W0718
                exception_count += 1
                logger.exception(
                    "Something went wrong while processing incoming events. Continuing..."
                )

                if exception_count >= max_exception_count:
                    raise  # exit inf loop

    def _attempt_process_list_events(self, list_key: str) -> None:
        """
        Attempts to process a list-based event in Redis, ensuring that only one instance processes
        the event at a time by acquiring a lock.

        If processing raises, the first element of the list is moved aside via
        `_handle_unprocessable_event`. The lock is always deleted afterwards.

        Args:
            list_key: The Redis key of the list to process.
        """
        lock_key = f"lock:{list_key}"
        extend_lock_task = None

        lock_duration = 2000  # milliseconds

        if self.redis_service.set_lock(lock_key, px=lock_duration):
            try:
                # Start a background task to extend the lock periodically
                # This is just to ensure that on the off chance that 2000ms isn't enough to process all the
                # events in the list, we want to avoid replicas processing the same webhook event twice
                # NOTE(review): the processing below is synchronous; if `extend_lock_task`
                # schedules an asyncio task, it presumably cannot run until this method
                # returns — confirm against WebhooksRedisService.
                extend_lock_task = self.redis_service.extend_lock_task(
                    lock_key, interval=datetime.timedelta(milliseconds=lock_duration)
                )

                self._process_list_events(list_key)
            except Exception as e:  # pylint: disable=W0718
                # if this particular event is unprocessable, we should remove it from the inputs, to avoid deadlocking
                logger.error("Processing {} raised an exception: {}", list_key, e)
                self._handle_unprocessable_event(list_key, e)
            finally:
                # Cancel the lock extension task if it's still running
                if extend_lock_task:
                    extend_lock_task.cancel()

                # Delete lock after processing list, whether it completed or errored:
                if self.redis_service.delete_key(lock_key):
                    logger.debug("Deleted lock key: {}", lock_key)
                else:
                    logger.warning(
                        "Could not delete lock key: {}. Perhaps it expired?", lock_key
                    )
        else:
            logger.debug(
                "Event {} is currently being processed by another instance.", list_key
            )

    def _process_list_events(self, list_key) -> None:
        """
        Processes all events in a Redis list until the list is empty. Each event is processed individually,
        and upon successful processing, it's removed from the list.

        Args:
            list_key: The Redis key of the list to process.

        Raises:
            Exception: any error raised while reading or processing an event is
                logged and re-raised; the failing element is left at the head of the list.
        """
        try:
            while True:  # Keep processing until no elements are left
                # Read 0th index of list:
                event_data = self.redis_service.lindex(list_key)
                if event_data:
                    self._process_event(event_data.decode())

                    # Cleanup: remove the element from the list and delete the lock if successfully processed
                    if self.redis_service.pop_first_list_element(list_key):
                        logger.debug(
                            "Removed processed element from list: {}", list_key
                        )
                    else:
                        logger.warning(
                            "Tried to pop list element from: {}, but already removed from list?",
                            list_key,
                        )
                else:
                    # If no data is found, the list is empty, exit the loop
                    logger.debug(
                        "No more data found for event key: {}, exiting.", list_key
                    )
                    break
        except Exception:
            logger.exception("Could not process list key {}", list_key)
            raise

    def _process_event(self, event_json: str) -> None:
        """
        Processes an individual ACA-Py event, transforming it to our CloudAPI format and saving/broadcasting to redis

        Events whose topic has no entry in `topic_mapping`, or for which no
        CloudAPI transformation exists, are logged and skipped.

        Args:
            event_json: The JSON string representation of the ACA-Py event.
        """
        event = parse_json_with_error_handling(AcaPyRedisEvent, event_json, logger)

        metadata_origin = event.metadata.origin

        if metadata_origin:
            origin = metadata_origin.lower()
        else:
            logger.warning("webhook event has unknown origin: {}", event)
            origin = "unknown"

        group_id = event.metadata.group_id
        wallet_id = event.metadata.x_wallet_id or origin

        acapy_topic = event.payload.category or event.payload.topic
        # category is the original acapy_topic as we used to received over http

        payload = event.payload.payload

        # Only the logging context gets the obfuscated payload; the event itself
        # is built from the original `payload` below.
        obfuscated_payload = self._obfuscate_sensitive_data(
            acapy_topic=acapy_topic, payload=payload
        )

        bound_logger = logger.bind(
            body={
                "wallet_id": wallet_id,
                "acapy_topic": acapy_topic,
                "origin": origin,
                "group_id": group_id,
                "payload": obfuscated_payload,
            }
        )
        bound_logger.debug("Processing ACA-Py Redis webhook event")

        # Map from the acapy webhook topic to a unified cloud api topic
        cloudapi_topic = topic_mapping.get(acapy_topic)
        if not cloudapi_topic:
            bound_logger.warning(
                "Not processing webhook event for acapy_topic `{}` as it doesn't exist in the topic_mapping",
                acapy_topic,
            )
            return

        acapy_webhook_event = AcaPyWebhookEvent(
            payload=payload,
            wallet_id=wallet_id,
            acapy_topic=acapy_topic,
            topic=cloudapi_topic,
            group_id=group_id,
            origin=origin,
        )

        cloudapi_webhook_event = acapy_to_cloudapi_event(acapy_webhook_event)
        if not cloudapi_webhook_event:
            bound_logger.warning(
                "Not processing webhook event for topic `{}` as no transformer exists for the topic",
                cloudapi_topic,
            )
            return

        webhook_event_json = cloudapi_webhook_event.model_dump_json()

        # Check if this webhook event should be forwarded to the Endorser service
        if (
            wallet_id == GOVERNANCE_LABEL  # represents event for the governance agent
            and cloudapi_topic == "endorsements"
            and payload_is_applicable_for_endorser(payload, logger=bound_logger)
        ):
            bound_logger.debug("Forwarding endorsement event for Endorser service")
            transaction_id = payload["transaction_id"]  # check has asserted key exists
            self.redis_service.add_endorsement_event(
                event_json=webhook_event_json, transaction_id=transaction_id
            )

        # Check if event is billable, and get operation_type if it is an endorsement event
        is_billable, operation_type = is_applicable_for_billing(
            wallet_id=wallet_id,
            group_id=group_id,
            topic=cloudapi_topic,
            payload=payload,
            logger=bound_logger,
        )
        if is_billable:
            bound_logger.debug(
                "Forwarding billing event for Billing service",
            )

            if cloudapi_topic == "endorsements":
                # Add the operation type to the payload for endorsements
                # Simplifies the billing service's logic for determining the operation type
                endorse_event: Dict[str, Any] = orjson.loads(webhook_event_json)
                endorse_event["payload"]["type"] = operation_type
                # orjson.dumps returns bytes; decode so both branches pass a str
                webhook_event_for_billing = orjson.dumps(endorse_event).decode()
            else:
                webhook_event_for_billing = webhook_event_json

            self.redis_service.add_billing_event(
                event_json=webhook_event_for_billing,
                group_id=group_id,
                wallet_id=wallet_id,
                timestamp_ns=event.metadata.time_ns,
            )

        # Add data to redis, which publishes to a redis pubsub channel that SseManager listens to
        self.redis_service.add_cloudapi_webhook_event(
            event_json=webhook_event_json,
            group_id=group_id,
            wallet_id=wallet_id,
            timestamp_ns=event.metadata.time_ns,
        )

        bound_logger.trace("Successfully processed ACA-Py Redis webhook event.")

    def _handle_unprocessable_event(self, key: str, error: Exception) -> None:
        """
        Handles an event that could not be processed successfully. The unprocessable event is persisted
        to a separate key for further investigation.

        The first element of the list at `key` is popped, and a message containing
        that element and the error is stored under a new `unprocessable:` key.

        Args:
            key: The Redis key where the problematic event was found.
            error: The exception that occurred during event processing.
        """
        logger.warning("Handling problematic event at key: {}", key)
        problematic_event = self.redis_service.pop_first_list_element(key)

        # Random suffix keeps records of separate failures on the same list distinct
        unprocessable_key = f"unprocessable:{key}:{uuid4().hex}"
        error_message = f"Could not process: {problematic_event}. Error: {error}"

        logger.warning(
            "Saving record of problematic event at key: {}. Error: `{}`",
            unprocessable_key,
            error_message,
        )
        self.redis_service.set(key=unprocessable_key, value=error_message)

    def _obfuscate_sensitive_data(
        self, acapy_topic: str, payload: Dict[str, Any]
    ) -> Dict[str, Any]:
        """
        Returns a version of the payload that is safe to attach to log records.

        The input payload is never mutated: when values need redacting, new dicts
        are built for the affected nesting levels.

        Args:
            acapy_topic: The ACA-Py topic of the event, which selects the obfuscation applied.
            payload: The original event payload.

        Returns:
            For `endorse_transaction`, the result of `obfuscate_primary_data_in_payload`.
            For `issue_credential_v2_0_indy` with master secret blinding data, a copy
            with `v_prime` / `vr_prime` replaced by "REDACTED".
            Otherwise the original payload, unmodified.
        """
        if acapy_topic == "endorse_transaction":
            return obfuscate_primary_data_in_payload(payload, logger)

        if acapy_topic == "issue_credential_v2_0_indy":
            metadata = payload.get("cred_request_metadata")
            blinding_data = (
                metadata.get("master_secret_blinding_data")
                if isinstance(metadata, dict)
                else None
            )

            if isinstance(blinding_data, dict):
                # Rebuild only the nested levels that change, so the caller's payload
                # (which is still used to build the actual event) keeps its values.
                redacted_blinding_data = {
                    field: "REDACTED" if field in ("v_prime", "vr_prime") else value
                    for field, value in blinding_data.items()
                }
                return {
                    **payload,
                    "cred_request_metadata": {
                        **metadata,
                        "master_secret_blinding_data": redacted_blinding_data,
                    },
                }

        # No modification:
        return payload