Skip to content

Commit

Permalink
Fix log arrival timezone (#715)
Browse files Browse the repository at this point in the history
* Add option to TimeParser to get current timestamp with timezone
* Fix timezone in log arrival and delta time
* Add TimeParser and log arrival time changes to changelog

---------

Co-authored-by: dtrai2 <[email protected]>
  • Loading branch information
ppcad and dtrai2 authored Dec 9, 2024
1 parent b20afb6 commit ccad610
Show file tree
Hide file tree
Showing 4 changed files with 34 additions and 13 deletions.
2 changes: 2 additions & 0 deletions CHANGELOG.md
Original file line number Diff line number Diff line change
Expand Up @@ -26,6 +26,7 @@ the list is now fixed inside the packaged logprep
* refactored some processors to make use of the new helper methods
* add `pre-commit` hooks to the repository, install new dev dependency and run `pre-commit install` in the root dir
* the default `securityContext`for the pod is now configurable
* allow `TimeParser` to get the current time with a specified timezone instead of always using local time and setting the timezone to UTC
* remove `tldextract` dependency
* remove `urlextract` dependency

Expand All @@ -34,6 +35,7 @@ the list is now fixed inside the packaged logprep
* fix `confluent_kafka.store_offsets` if `last_valid_record` is `None`, can happen if a rebalancing happens
before the first message was pulled.
* fix pseudonymizer cache metrics not updated
* fix incorrect timezones for log arrival time and delta time in input preprocessing
* fix `_get_value` in `FilterExpression` so that keys don't match on values
* fix `auto_rule_tester` to work with `LOGPREP_BYPASS_RULE_TREE` enabled

Expand Down
17 changes: 10 additions & 7 deletions logprep/abc/input.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,9 +8,10 @@
import zlib
from abc import abstractmethod
from copy import deepcopy
from functools import partial
from functools import partial, cached_property
from hmac import HMAC
from typing import Optional, Tuple
from zoneinfo import ZoneInfo

from attrs import define, field, validators

Expand Down Expand Up @@ -198,6 +199,11 @@ def _add_version_info(self):
"""Check and return if the version info should be added to the event."""
return bool(self._config.preprocessing.get("version_info_target_field"))

@cached_property
def _log_arrival_timestamp_timezone(self):
"""Returns the timezone for log arrival timestamps"""
return ZoneInfo("UTC")

@property
def _add_log_arrival_time_information(self):
"""Check and return if the log arrival time info should be added to the event."""
Expand Down Expand Up @@ -311,12 +317,9 @@ def _add_env_enrichment_to_event(self, event: dict):
add_fields_to(event, fields)

def _add_arrival_time_information_to_event(self, event: dict):
new_field = {
self._config.preprocessing.get(
"log_arrival_time_target_field"
): TimeParser.now().isoformat()
}
add_fields_to(event, new_field)
target = self._config.preprocessing.get("log_arrival_time_target_field")
time = TimeParser.now(self._log_arrival_timestamp_timezone).isoformat()
add_fields_to(event, {target: time})

def _add_arrival_timedelta_information_to_event(self, event: dict):
log_arrival_timedelta_config = self._config.preprocessing.get("log_arrival_timedelta")
Expand Down
9 changes: 7 additions & 2 deletions logprep/util/time.py
Original file line number Diff line number Diff line change
Expand Up @@ -61,15 +61,20 @@ def from_timestamp(cls, timestamp: Union[int, float]) -> datetime:
return time_object

@classmethod
def now(cls) -> datetime:
def now(cls, timezone: tzinfo = None) -> datetime:
"""returns the current time
Parameters
----------
timezone : tzinfo
the timezone to use for the timestamp
Returns
-------
datetime
current date and time as datetime
"""
time_object = datetime.now()
time_object = datetime.now(timezone)
time_object = cls._set_utc_if_timezone_is_missing(time_object)
return time_object

Expand Down
19 changes: 15 additions & 4 deletions tests/unit/util/test_time.py
Original file line number Diff line number Diff line change
Expand Up @@ -60,11 +60,22 @@ def test_from_format_returns(self, source, format_str, expected):
for attribute, value in expected.items():
assert getattr(timestamp, attribute) == value

@pytest.mark.parametrize("timezone", [None, ZoneInfo("UTC"), ZoneInfo("Europe/Berlin")])
def test_has_utc_if_timezone_was_set(self, timezone):
datetime_time = datetime.now(timezone)
time_parser_time = TimeParser.now(timezone)
assert time_parser_time.second == pytest.approx(datetime_time.second, abs=1)
if timezone is None:
assert time_parser_time.tzinfo == ZoneInfo("UTC")
else:
assert time_parser_time.tzinfo == timezone

def test_set_utc_if_timezone_is_missing_sets_timezone(self):
time_object = datetime.now()
assert time_object.tzinfo is None
time_object = TimeParser._set_utc_if_timezone_is_missing(time_object)
assert time_object.tzinfo is ZoneInfo("UTC")
datetime_time = datetime.now()
assert datetime_time.tzinfo is None
time_parser_time = TimeParser._set_utc_if_timezone_is_missing(datetime_time)
assert time_parser_time.tzinfo is ZoneInfo("UTC")
assert time_parser_time.second == pytest.approx(datetime_time.second, abs=1)

@pytest.mark.parametrize(
"timestamp, source_format, source_timezone, expected_timezone_name, expected",
Expand Down

0 comments on commit ccad610

Please sign in to comment.