[DPE-2366][DPE-2365] HA tests #129
Merged
Changes from all commits (22):
73e2217 add two cluster ha test (zmraul)
13d857e add test to CI (zmraul)
fd8aafa restructure tests pipeline (zmraul)
60e6e7a fix lint (zmraul)
4cbdadb tell better joke to the pipeline (zmraul)
2c38803 add tests and restructure (zmraul)
b352065 Merge branch 'test/high-availability' into test/dpe-2366-read-secondary (zmraul)
ca80901 fix kafka command (zmraul)
8db9f39 fix produce logs (zmraul)
239f713 general fixes (zmraul)
2c42417 add pr feedback and remove unused files (zmraul)
4989b11 fix test (zmraul)
cc35140 fix (zmraul)
e02dd84 restructure tests (zmraul)
d9f6623 add continuous writes structure (zmraul)
316ca00 redo kill broker test with continuous writes (zmraul)
d80831e fix imports (zmraul)
0e82c7e add delay to restart (zmraul)
ca356d8 fix lint (zmraul)
413492e fix asserts (zmraul)
b2271d4 general fixes (zmraul)
ffd4485 add pf feedback (zmraul)

@@ -7,4 +7,5 @@ __pycache__/
 *.py[cod]
 .vscode
 .idea
-.python-version
+.python-version
+last_written_value

@@ -0,0 +1 @@
20052,0
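
The committed 20052,0 line above appears to be an artifact of the ContinuousWrites helper further down in this diff, which writes "<last written value>,<lost message count>" to a file named last_written_value when the writer process stops. A minimal sketch of how such a line can be read back (assuming the file sits in the current working directory, as the helper assumes):

    # Sketch only: mirrors the parsing done in ContinuousWrites.stop() below.
    with open("last_written_value", "r") as f:
        last_written, lost = f.read().rstrip().split(",", maxsplit=1)
    # For the committed example "20052,0": the last expected written value is 20052
    # and 0 messages were lost to produce timeouts.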

@@ -0,0 +1,2 @@
# Copyright 2023 Canonical Ltd.
# See LICENSE file for licensing details.

@@ -0,0 +1,220 @@
#!/usr/bin/env python3
# Copyright 2023 Canonical Ltd.
# See LICENSE file for licensing details.
import asyncio
import logging
import os
from multiprocessing import Event, Process, Queue
from types import SimpleNamespace

from charms.kafka.v0.client import KafkaClient
from kafka.admin import NewTopic
from kafka.errors import KafkaTimeoutError
from pytest_operator.plugin import OpsTest
from tenacity import (
    RetryError,
    Retrying,
    retry,
    stop_after_attempt,
    stop_after_delay,
    wait_fixed,
    wait_random,
)

from integration.helpers import DUMMY_NAME, get_provider_data

logger = logging.getLogger(__name__)


class ContinuousWrites:
    """Utility class for managing continuous writes."""

    TOPIC_NAME = "ha-test-topic"
    LAST_WRITTEN_VAL_PATH = "last_written_value"

    def __init__(self, ops_test: OpsTest, app: str):
        self._ops_test = ops_test
        self._app = app
        self._is_stopped = True
        self._event = None
        self._queue = None
        self._process = None

    @retry(
        wait=wait_fixed(wait=5) + wait_random(0, 5),
        stop=stop_after_attempt(5),
    )
    def start(self) -> None:
        """Run continuous writes in the background."""
        if not self._is_stopped:
            self.clear()

        # create topic
        self._create_replicated_topic()

        # create process
        self._create_process()

        # pass the model full name to the process once it starts
        self.update()

        # start writes
        self._process.start()

    def update(self):
        """Update cluster related conf. Useful in cases such as scaling, pwd change etc."""
        self._queue.put(SimpleNamespace(model_full_name=self._ops_test.model_full_name))

    @retry(
        wait=wait_fixed(wait=5) + wait_random(0, 5),
        stop=stop_after_attempt(5),
    )
    def clear(self) -> None:
        """Stop writes and delete the topic."""
        if not self._is_stopped:
            self.stop()

        client = self._client()
        try:
            client.delete_topics(topics=[self.TOPIC_NAME])
        finally:
            client.close()

    def consumed_messages(self) -> list | None:
        """Consume the messages in the topic."""
        client = self._client()
        try:
            for attempt in Retrying(stop=stop_after_attempt(5), wait=wait_fixed(5)):
                with attempt:
                    client.subscribe_to_topic(topic_name=self.TOPIC_NAME)
                    # FIXME: loading whole list of consumed messages into memory might not be the best idea
                    return list(client.messages())
        except RetryError:
            return []
        finally:
            client.close()

    def _create_replicated_topic(self):
        """Create topic with replication_factor = 3."""
        client = self._client()
        topic_config = NewTopic(
            name=self.TOPIC_NAME,
            num_partitions=1,
            replication_factor=3,
        )
        client.create_topic(topic=topic_config)

    @retry(
        wait=wait_fixed(wait=5) + wait_random(0, 5),
        stop=stop_after_attempt(5),
    )
    def stop(self) -> SimpleNamespace:
        """Stop the continuous writes process and return max inserted ID."""
        if not self._is_stopped:
            self._stop_process()

        result = SimpleNamespace()

        # messages count
        consumed_messages = self.consumed_messages()
        result.count = len(consumed_messages)
        result.last_message = consumed_messages[-1]

        # last expected message stored on disk
        try:
            for attempt in Retrying(stop=stop_after_delay(60), wait=wait_fixed(5)):
                with attempt:
                    with open(ContinuousWrites.LAST_WRITTEN_VAL_PATH, "r") as f:
                        result.last_expected_message, result.lost_messages = (
                            f.read().rstrip().split(",", maxsplit=2)
                        )
        except RetryError:
            result.last_expected_message = result.lost_messages = -1

        return result

    def _create_process(self):
        self._is_stopped = False
        self._event = Event()
        self._queue = Queue()
        self._process = Process(
            target=ContinuousWrites._run_async,
            name="continuous_writes",
            args=(self._event, self._queue, 0),
        )

    def _stop_process(self):
        self._event.set()
        self._process.join()
        self._queue.close()
        self._is_stopped = True

    def _client(self):
        """Build a Kafka client."""
        relation_data = get_provider_data(
            unit_name=f"{DUMMY_NAME}/0",
            model_full_name=self._ops_test.model_full_name,
            endpoint="kafka-client-admin",
        )
        return KafkaClient(
            servers=relation_data["endpoints"].split(","),
            username=relation_data["username"],
            password=relation_data["password"],
            security_protocol="SASL_PLAINTEXT",
        )

    @staticmethod
    async def _run(event: Event, data_queue: Queue, starting_number: int) -> None:  # noqa: C901
        """Continuous writing."""
        initial_data = data_queue.get(True)

        def _client():
            """Build a Kafka client."""
            relation_data = get_provider_data(
                unit_name=f"{DUMMY_NAME}/0",
                model_full_name=initial_data.model_full_name,
                endpoint="kafka-client-admin",
            )
            return KafkaClient(
                servers=relation_data["endpoints"].split(","),
                username=relation_data["username"],
                password=relation_data["password"],
                security_protocol="SASL_PLAINTEXT",
            )

        write_value = starting_number
        lost_messages = 0
        client = _client()

        while True:
            if not data_queue.empty():  # currently evaluates to false as we don't make updates
                data_queue.get(False)
                client.close()
                client = _client()

            try:
                client.produce_message(
                    topic_name=ContinuousWrites.TOPIC_NAME, message_content=str(write_value)
                )
            except KafkaTimeoutError:
                client.close()
                client = _client()
                lost_messages += 1
            finally:
                # process termination requested
                if event.is_set():
                    break

            write_value += 1

        # write last expected written value on disk
        with open(ContinuousWrites.LAST_WRITTEN_VAL_PATH, "w") as f:
            f.write(f"{str(write_value)},{str(lost_messages)}")
            os.fsync(f)

        client.close()

    @staticmethod
    def _run_async(event: Event, data_queue: Queue, starting_number: int):
        """Run async code."""
        asyncio.run(ContinuousWrites._run(event, data_queue, starting_number))
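
For orientation, a minimal sketch of how a HA test might drive this utility. The test name, charm application name, sleep duration, and import path below are assumptions for illustration, not taken from this PR:

    # Illustrative usage only; names and import path are assumed, not part of this diff.
    import asyncio

    import pytest
    from pytest_operator.plugin import OpsTest

    from integration.ha.continuous_writes import ContinuousWrites  # path assumed


    @pytest.mark.abort_on_fail
    async def test_writes_survive_broker_restart(ops_test: OpsTest):
        c_writes = ContinuousWrites(ops_test, app="kafka")
        c_writes.start()  # spawns the background producer process
        await asyncio.sleep(60)  # let writes accumulate while the cluster is disrupted
        result = c_writes.stop()  # joins the writer and consumes the topic back
        c_writes.clear()  # deletes the test topic

        # result carries count, last_message, last_expected_message and lost_messages
        assert int(result.lost_messages) == 0
        assert result.count > 0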

Review comment:
nit: this could perhaps be externalized in a helper, so it can be called from the _run._client() function without having to duplicate it
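
A sketch of what the reviewer suggests: pull the client construction into one shared helper that both ContinuousWrites._client() and the inner _client() in _run() can call. The name build_kafka_admin_client and where it would live are assumptions; it is shown here as a standalone snippet that reuses the existing helpers:

    # Hypothetical helper, illustrative only: one place to build an admin Kafka client
    # from the kafka-client-admin relation data of the dummy application's first unit.
    from charms.kafka.v0.client import KafkaClient

    from integration.helpers import DUMMY_NAME, get_provider_data


    def build_kafka_admin_client(model_full_name: str) -> KafkaClient:
        relation_data = get_provider_data(
            unit_name=f"{DUMMY_NAME}/0",
            model_full_name=model_full_name,
            endpoint="kafka-client-admin",
        )
        return KafkaClient(
            servers=relation_data["endpoints"].split(","),
            username=relation_data["username"],
            password=relation_data["password"],
            security_protocol="SASL_PLAINTEXT",
        )

With such a helper, ContinuousWrites._client() could reduce to return build_kafka_admin_client(self._ops_test.model_full_name), and the inner _client() in _run() to return build_kafka_admin_client(initial_data.model_full_name), removing the duplication the reviewer points at.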