Commit 0206f1b (1 parent: ed57cc9)
Showing 1 changed file with 379 additions and 0 deletions.
@@ -0,0 +1,379 @@
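"""Tests for the Temporal batch exports logger.

Covers binding context variables, formatting of positional arguments, binding of
Temporal activity context, queueing of log entries for async processing, and
producing log entries to Kafka for ingestion into ClickHouse.
"""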
import asyncio
import dataclasses
import datetime as dt
import json
import random
import time
import uuid

import aiokafka
import freezegun
import pytest
import pytest_asyncio
import structlog
import temporalio.activity
import temporalio.testing
from django.conf import settings

from posthog.clickhouse.client import sync_execute
from posthog.clickhouse.log_entries import (
    KAFKA_LOG_ENTRIES_TABLE_SQL,
    LOG_ENTRIES_TABLE,
    LOG_ENTRIES_TABLE_MV_SQL,
    TRUNCATE_LOG_ENTRIES_TABLE_SQL,
)
from posthog.kafka_client.topics import KAFKA_LOG_ENTRIES
from posthog.temporal.workflows.logger import bind_batch_exports_logger, configure_logger

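# `pytest.mark.asyncio` marks every coroutine test in this module for pytest-asyncio;
# `asyncio_event_loop` is assumed to be the (version-specific) pytest-asyncio marker that
# shares a single event loop across the module's tests.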
pytestmark = [pytest.mark.asyncio_event_loop, pytest.mark.asyncio]


class LogCapture:
    """A test structlog processor to capture logs."""

    def __init__(self):
        self.entries = []

    def __call__(self, logger, method_name, event_dict):
        """Append event_dict to entries and drop the log."""
        self.entries.append(event_dict)
        raise structlog.DropEvent()


@pytest.fixture()
def log_capture():
    """Return a LogCapture processor for inspection in tests."""
    return LogCapture()


class QueueCapture(asyncio.Queue):
    """A test asyncio.Queue that captures items that we put into it."""

    def __init__(self, *args, **kwargs):
        super().__init__(*args, **kwargs)
        self.entries = []

    def put_nowait(self, item):
        """Append item to entries and delegate to asyncio.Queue."""
        self.entries.append(item)
        super().put_nowait(item)


@pytest_asyncio.fixture()
async def queue():
    """Return a QueueCapture queue for inspection in tests."""
    queue = QueueCapture(maxsize=-1)

    yield queue


class CaptureKafkaProducer(aiokafka.AIOKafkaProducer):
    """A test aiokafka.AIOKafkaProducer that captures calls to send_and_wait."""

    def __init__(self, *args, **kwargs):
        super().__init__(*args, **kwargs)
        self.entries = []

    async def send_and_wait(self, topic, value=None, key=None, partition=None, timestamp_ms=None, headers=None):
        """Append an entry and delegate to aiokafka.AIOKafkaProducer."""
        self.entries.append(
            {
                "topic": topic,
                "value": value,
                "key": key,
                "partition": partition,
                "timestamp_ms": timestamp_ms,
                "headers": headers,
            }
        )
        return await super().send_and_wait(topic, value, key, partition, timestamp_ms, headers)


@pytest_asyncio.fixture(scope="function")
async def producer(event_loop):
    """Yield a CaptureKafkaProducer to inspect captured entries.

    After usage, we ensure the producer was closed to avoid leaking/warnings.
    """
    producer = CaptureKafkaProducer(bootstrap_servers=settings.KAFKA_HOSTS, loop=event_loop)

    yield producer

    if producer._closed is False:
        await producer.stop()


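# NOTE: `configure_logger` is assumed here to return the background task(s) that drain the
# log queue and forward entries to the Kafka producer; the fixture below cancels and awaits
# them on teardown so nothing leaks between tests.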
@pytest_asyncio.fixture(autouse=True)
async def configure(log_capture, queue, producer):
    """Configure structlog logging for testing.

    The extra parameters configured for testing are:
    * Add a LogCapture processor to capture logs.
    * Set the queue and producer to capture messages sent.
    * Do not cache the logger to ensure each test starts clean.
    """
    tasks = await configure_logger(
        extra_processors=[log_capture], queue=queue, producer=producer, cache_logger_on_first_use=False
    )

    yield tasks

    for task in tasks:
        # Clean up logger tasks to avoid leaking/warnings.
        task.cancel()

    await asyncio.wait(tasks)


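# The entries captured by `LogCapture` arrive as rendered JSON strings, hence the
# `json.loads` calls in the assertions below.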
@pytest.mark.asyncio
async def test_batch_exports_logger_binds_context(log_capture):
    """Test whether we can bind context variables."""
    logger = await bind_batch_exports_logger(team_id=1, destination="Somewhere")

    logger.info("Hi! This is an info log")
    logger.error("Hi! This is an error log")

    assert len(log_capture.entries) == 2

    info_entry, error_entry = log_capture.entries
    info_dict, error_dict = json.loads(info_entry), json.loads(error_entry)
    assert info_dict["team_id"] == 1
    assert info_dict["destination"] == "Somewhere"

    assert error_dict["team_id"] == 1
    assert error_dict["destination"] == "Somewhere"


@pytest.mark.asyncio
async def test_batch_exports_logger_formats_positional_args(log_capture):
    """Test whether positional arguments are formatted in the message."""
    logger = await bind_batch_exports_logger(team_id=1, destination="Somewhere")

    logger.info("Hi! This is an %s log", "info")
    logger.error("Hi! This is an %s log", "error")

    assert len(log_capture.entries) == 2

    info_entry, error_entry = log_capture.entries
    info_dict, error_dict = json.loads(info_entry), json.loads(error_entry)
    assert info_dict["msg"] == "Hi! This is an info log"
    assert error_dict["msg"] == "Hi! This is an error log"


@dataclasses.dataclass
class TestActivityInfo:
    """Provide our own Activity Info for testing."""

    workflow_id: str
    workflow_type: str
    workflow_run_id: str
    attempt: int


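# `indirect=True` in the parametrizations below routes each `TestActivityInfo` through this
# fixture via `request.param`, letting tests fake the Temporal activity info.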
@pytest.fixture
def activity_environment(request):
    """Return a testing temporal ActivityEnvironment."""
    env = temporalio.testing.ActivityEnvironment()
    env.info = request.param
    return env


BATCH_EXPORT_ID = str(uuid.uuid4())


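# Workflow IDs are built as f"{BATCH_EXPORT_ID}-..." (with a "-Backfill-" infix for backfill
# runs); the tests below expect the logger to recover the batch export ID from that prefix
# as `log_source_id`, and to derive `log_source` from the workflow type.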
@pytest.mark.parametrize(
    "activity_environment",
    [
        TestActivityInfo(
            workflow_id=f"{BATCH_EXPORT_ID}-{dt.datetime.utcnow()}",
            workflow_type="s3-export",
            workflow_run_id=str(uuid.uuid4()),
            attempt=random.randint(1, 10000),
        ),
        TestActivityInfo(
            workflow_id=f"{BATCH_EXPORT_ID}-Backfill-{dt.datetime.utcnow()}",
            workflow_type="backfill-batch-export",
            workflow_run_id=str(uuid.uuid4()),
            attempt=random.randint(1, 10000),
        ),
    ],
    indirect=True,
)
async def test_batch_exports_logger_binds_activity_context(
    log_capture,
    activity_environment,
):
    """Test whether our logger binds variables from a Temporal Activity."""

    @temporalio.activity.defn
    async def log_activity():
        """A simple temporal activity that just logs."""
        logger = await bind_batch_exports_logger(team_id=1, destination="Somewhere")

        logger.info("Hi! This is an %s log from an activity", "info")

    await activity_environment.run(log_activity)

    assert len(log_capture.entries) == 1

    info_dict = json.loads(log_capture.entries[0])
    assert info_dict["team_id"] == 1
    assert info_dict["destination"] == "Somewhere"
    assert info_dict["workflow_id"] == activity_environment.info.workflow_id
    assert info_dict["workflow_type"] == activity_environment.info.workflow_type
    assert info_dict["log_source_id"] == BATCH_EXPORT_ID
    assert info_dict["workflow_run_id"] == activity_environment.info.workflow_run_id
    assert info_dict["attempt"] == activity_environment.info.attempt

    if activity_environment.info.workflow_type == "backfill-batch-export":
        assert info_dict["log_source"] == "batch_exports_backfill"
    else:
        assert info_dict["log_source"] == "batch_exports"


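# freezegun pins the wall clock so the "timestamp" field written by the logger can be
# asserted exactly; the queue fixture captures the raw bytes put on the logging queue.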
@freezegun.freeze_time("2023-11-02 10:00:00.123123") | ||
@pytest.mark.parametrize( | ||
"activity_environment", | ||
[ | ||
TestActivityInfo( | ||
workflow_id=f"{BATCH_EXPORT_ID}-{dt.datetime.utcnow()}", | ||
workflow_type="s3-export", | ||
workflow_run_id=str(uuid.uuid4()), | ||
attempt=random.randint(1, 10000), | ||
), | ||
TestActivityInfo( | ||
workflow_id=f"{BATCH_EXPORT_ID}-Backfill-{dt.datetime.utcnow()}", | ||
workflow_type="backfill-batch-export", | ||
workflow_run_id=str(uuid.uuid4()), | ||
attempt=random.randint(1, 10000), | ||
), | ||
], | ||
indirect=True, | ||
) | ||
async def test_batch_exports_logger_puts_in_queue(activity_environment, queue): | ||
"""Test whether our logger puts entries into a queue for async processing.""" | ||
|
||
@temporalio.activity.defn | ||
async def log_activity(): | ||
"""A simple temporal activity that just logs.""" | ||
logger = await bind_batch_exports_logger(team_id=2, destination="Somewhere") | ||
|
||
logger.info("Hi! This is an %s log from an activity", "info") | ||
|
||
await activity_environment.run(log_activity) | ||
|
||
assert len(queue.entries) == 1 | ||
message_dict = json.loads(queue.entries[0].decode("utf-8")) | ||
|
||
assert message_dict["instance_id"] == activity_environment.info.workflow_run_id | ||
assert message_dict["level"] == "info" | ||
|
||
if activity_environment.info.workflow_type == "backfill-batch-export": | ||
assert message_dict["log_source"] == "batch_exports_backfill" | ||
else: | ||
assert message_dict["log_source"] == "batch_exports" | ||
|
||
assert message_dict["log_source_id"] == BATCH_EXPORT_ID | ||
assert message_dict["message"] == "Hi! This is an info log from an activity" | ||
assert message_dict["team_id"] == 2 | ||
assert message_dict["timestamp"] == "2023-11-02 10:00:00.123123" | ||
|
||
|
||
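# Sets up the Kafka-backed table and materialized view for LOG_ENTRIES_TABLE (presumably a
# ClickHouse Kafka engine table feeding the target table), truncates it, and drops both
# again after the test.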
@pytest.fixture()
def log_entries_table():
    """Manage log_entries table for testing."""
    sync_execute(KAFKA_LOG_ENTRIES_TABLE_SQL())
    sync_execute(LOG_ENTRIES_TABLE_MV_SQL)
    sync_execute(TRUNCATE_LOG_ENTRIES_TABLE_SQL)

    yield LOG_ENTRIES_TABLE

    sync_execute(f"DROP TABLE {LOG_ENTRIES_TABLE}_mv")
    sync_execute(f"DROP TABLE kafka_{LOG_ENTRIES_TABLE}")
    sync_execute(TRUNCATE_LOG_ENTRIES_TABLE_SQL)


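# End-to-end check: `queue.join()` waits until the queued entry has been consumed
# (presumably by the background task from `configure_logger`) and sent via the captured
# Kafka producer; the test then polls ClickHouse until the row has been ingested.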
@freezegun.freeze_time("2023-11-03 10:00:00.123123") | ||
@pytest.mark.django_db | ||
@pytest.mark.parametrize( | ||
"activity_environment", | ||
[ | ||
TestActivityInfo( | ||
workflow_id=f"{BATCH_EXPORT_ID}-{dt.datetime.utcnow()}", | ||
workflow_type="s3-export", | ||
workflow_run_id=str(uuid.uuid4()), | ||
attempt=random.randint(1, 10000), | ||
), | ||
TestActivityInfo( | ||
workflow_id=f"{BATCH_EXPORT_ID}-Backfill-{dt.datetime.utcnow()}", | ||
workflow_type="backfill-batch-export", | ||
workflow_run_id=str(uuid.uuid4()), | ||
attempt=random.randint(1, 10000), | ||
), | ||
], | ||
indirect=True, | ||
) | ||
async def test_batch_exports_logger_produces_to_kafka(activity_environment, producer, queue, log_entries_table): | ||
"""Test whether our logger produces messages to Kafka. | ||
We also check if those messages are ingested into ClickHouse. | ||
""" | ||
|
||
@temporalio.activity.defn | ||
async def log_activity(): | ||
"""A simple temporal activity that just logs.""" | ||
logger = await bind_batch_exports_logger(team_id=3, destination="Somewhere") | ||
|
||
logger.info("Hi! This is an %s log from an activity", "info") | ||
|
||
await activity_environment.run(log_activity) | ||
assert len(queue.entries) == 1 | ||
|
||
await queue.join() | ||
|
||
if activity_environment.info.workflow_type == "backfill-batch-export": | ||
expected_log_source = "batch_exports_backfill" | ||
else: | ||
expected_log_source = "batch_exports" | ||
|
||
expected_dict = { | ||
"instance_id": activity_environment.info.workflow_run_id, | ||
"level": "info", | ||
"log_source": expected_log_source, | ||
"log_source_id": BATCH_EXPORT_ID, | ||
"message": "Hi! This is an info log from an activity", | ||
"team_id": 3, | ||
"timestamp": "2023-11-03 10:00:00.123123", | ||
} | ||
|
||
assert len(producer.entries) == 1 | ||
assert producer.entries[0] == { | ||
"topic": KAFKA_LOG_ENTRIES, | ||
"value": json.dumps(expected_dict).encode("utf-8"), | ||
"key": None, | ||
"partition": None, | ||
"timestamp_ms": None, | ||
"headers": None, | ||
} | ||
|
||
results = sync_execute( | ||
f"SELECT instance_id, level, log_source, log_source_id, message, team_id, timestamp FROM {log_entries_table}" | ||
) | ||
|
||
while not results: | ||
# It may take a bit for CH to ingest. | ||
time.sleep(2) | ||
results = sync_execute( | ||
f"SELECT instance_id, level, log_source, log_source_id, message, team_id, timestamp FROM {log_entries_table}" | ||
) | ||
|
||
assert len(results) == 1 # type: ignore | ||
|
||
row = results[0] # type: ignore | ||
assert row[0] == activity_environment.info.workflow_run_id | ||
assert row[1] == "info" | ||
assert row[2] == expected_log_source | ||
assert row[3] == BATCH_EXPORT_ID | ||
assert row[4] == "Hi! This is an info log from an activity" | ||
assert row[5] == 3 | ||
assert row[6].isoformat() == "2023-11-03T10:00:00.123123+00:00" |