|
| 1 | +""" |
| 2 | +A backend that simply logs the statements to a xapi_tracking logger. |
| 3 | +
|
| 4 | +Vector just reads the log statements, so all we need to do is emit them. |
| 5 | +All other tasks use the raw Clickhouse inserts. |
| 6 | +""" |
| 7 | + |
| 8 | +import logging |
| 9 | +import sys |
| 10 | +from logging import Logger, getLogger |
| 11 | +from typing import List |
| 12 | + |
| 13 | +from xapi_db_load.backends.base_async_backend import ( |
| 14 | + BaseBackendTasks, |
| 15 | +) |
| 16 | +from xapi_db_load.backends.clickhouse import ( |
| 17 | + InsertBlocks, |
| 18 | + InsertCourses, |
| 19 | + InsertExternalIDs, |
| 20 | + InsertInitialEnrollments, |
| 21 | + InsertObjectTags, |
| 22 | + InsertProfiles, |
| 23 | + InsertTags, |
| 24 | + InsertTaxonomies, |
| 25 | + InsertXAPIEvents, |
| 26 | +) |
| 27 | +from xapi_db_load.generate_load_async import EventGenerator |
| 28 | + |
| 29 | + |
class AsyncVectorTasks(BaseBackendTasks):
    """
    Task collection for the Vector backend.

    Uses the insert tasks imported from the ClickHouse backend for everything except
    the xAPI events, which go through InsertXAPIEventsVector instead.
    """

    def __repr__(self) -> str:
        db_host = self.config["db_host"]
        return f"AsyncVectorTasks: {db_host}"

    def get_test_data_tasks(self):
        """
        Build the list of tasks to run: the event generator followed by one instance
        of each insert task.
        """
        # Every insert task is constructed with the same three arguments.
        shared_args = (self.config, self.logger, self.event_generator)

        task_classes = (
            InsertInitialEnrollments,
            InsertCourses,
            InsertBlocks,
            InsertObjectTags,
            InsertTaxonomies,
            InsertTags,
            InsertExternalIDs,
            InsertProfiles,
            # This is the only change from the ClickHouse backend
            InsertXAPIEventsVector,
        )

        tasks = [self.event_generator]
        for task_cls in task_classes:
            tasks.append(task_cls(*shared_args))
        return tasks
| 51 | + |
| 52 | + |
class InsertXAPIEventsVector(InsertXAPIEvents):
    """
    Emit xAPI events as log lines on stdout instead of inserting them into ClickHouse.

    Subclasses the ClickHouse InsertXAPIEvents task and overrides the row formatting
    and insert steps so that every event is written to the "xapi_tracking" logger.
    """

    # Name attached to the stdout handler this class installs, so that a later
    # instance can recognise and replace it instead of stacking another handler.
    _HANDLER_NAME = "xapi_db_load_vector_stdout"

    def __init__(self, config: dict, logger: Logger, event_generator: EventGenerator):
        """
        Set up the task and configure the "xapi_tracking" logger to write to stdout.

        Args:
            config: Load configuration, passed through to the parent task.
            logger: Logger passed through to the parent task.
            event_generator: Event generator passed through to the parent task.
        """
        super().__init__(config, logger, event_generator)

        self.xapi_logger = getLogger("xapi_tracking")
        self.xapi_logger.setLevel(logging.INFO)

        # getLogger() returns the same logger object for a given name, so handlers
        # added by earlier instances are still attached. Drop the one we installed
        # before; otherwise each additional instance would make every event print
        # one more time.
        for existing_handler in list(self.xapi_logger.handlers):
            if existing_handler.get_name() == self._HANDLER_NAME:
                self.xapi_logger.removeHandler(existing_handler)

        stream_handler = logging.StreamHandler(sys.stdout)
        stream_handler.set_name(self._HANDLER_NAME)
        # This formatter is different from what the LMS uses, but is the smallest possible
        # format that passes Vector's regex
        formatter = logging.Formatter(" [{name}] [] {message}", style="{")
        stream_handler.setFormatter(formatter)
        self.xapi_logger.addHandler(stream_handler)

    def _format_row(self, row: dict):
        """
        Override the ClickHouse backend's row formatting: keep only the "event" value.

        Args:
            row: Generated row; must contain an "event" key.

        Returns:
            The value stored under row["event"], which is what gets logged.
        """
        return row["event"]

    async def _do_insert(self, out_data: List):
        """
        Log each item of the batch to the "xapi_tracking" logger instead of inserting
        into ClickHouse.

        Args:
            out_data: Batch of items to emit, one log statement per item
                (presumably the values produced by _format_row -- confirm in the
                parent class).
        """
        for event_json in out_data:
            self.xapi_logger.info(event_json)
0 commit comments