2021-11-15 23:23:49 +08:00
|
|
|
#!/usr/bin/python3
|
|
|
|
|
|
|
|
# Copyright 2021 Memgraph Ltd.
|
|
|
|
#
|
|
|
|
# Use of this software is governed by the Business Source License
|
|
|
|
# included in the file licenses/BSL.txt; by using this file, you agree to be bound by the terms of the Business Source
|
|
|
|
# License, and you may not use this file except in compliance with the Business Source License.
|
|
|
|
#
|
|
|
|
# As of the Change Date specified in that file, in accordance with
|
|
|
|
# the Business Source License, use of this software will be governed
|
|
|
|
# by the Apache License, Version 2.0, included in the file
|
|
|
|
# licenses/APL.txt.
|
|
|
|
|
|
|
|
import sys
|
|
|
|
import time
|
2023-12-21 03:03:06 +08:00
|
|
|
from multiprocessing import Process
|
|
|
|
|
2021-11-15 23:23:49 +08:00
|
|
|
import common
|
2023-12-21 03:03:06 +08:00
|
|
|
import mgclient
|
|
|
|
import pytest
|
|
|
|
from mg_utils import mg_sleep_and_assert
|
2021-11-15 23:23:49 +08:00
|
|
|
|
2022-06-20 20:09:45 +08:00
|
|
|
# Transformation names that test_load_c_transformations is parametrized over.
TRANSFORMATIONS_TO_CHECK_C = [
    "c_transformations.empty_transformation",
]

# Transformation names that the "transformation"-parametrized tests in this file run against.
TRANSFORMATIONS_TO_CHECK_PY = [
    "kafka_transform.simple",
    "kafka_transform.with_parameters",
]

# Passed as `timeout=` to `.get()` on the result of every `kafka_producer.send(...)`
# (presumably seconds -- confirm against the producer library).
KAFKA_PRODUCER_SENDING_MSG_DEFAULT_TIMEOUT = 60
|
2022-04-29 02:28:44 +08:00
|
|
|
|
2021-11-15 23:23:49 +08:00
|
|
|
|
2022-04-29 02:28:44 +08:00
|
|
|
@pytest.mark.parametrize("transformation", TRANSFORMATIONS_TO_CHECK_PY)
def test_simple(kafka_producer, kafka_topics, connection, transformation):
    """Create one stream over all topics, send SIMPLE_MSG to each topic and run the vertex check per topic."""
    assert len(kafka_topics) > 0

    # The stream is named after the part of the transformation that follows the first dot.
    transformation_suffix = transformation.split(".")[1]
    stream_name = f"test_simple_{transformation_suffix}"

    cursor = connection.cursor()
    all_topics = ",".join(kafka_topics)
    common.create_stream(cursor, stream_name, all_topics, transformation)
    common.start_stream(cursor, stream_name)

    # Wait on every send before any verification starts.
    for kafka_topic in kafka_topics:
        pending_send = kafka_producer.send(kafka_topic, common.SIMPLE_MSG)
        pending_send.get(timeout=KAFKA_PRODUCER_SENDING_MSG_DEFAULT_TIMEOUT)

    for kafka_topic in kafka_topics:
        common.kafka_check_vertex_exists_with_topic_and_payload(cursor, kafka_topic, common.SIMPLE_MSG)
|
2021-11-15 23:23:49 +08:00
|
|
|
|
|
|
|
|
2022-04-29 02:28:44 +08:00
|
|
|
@pytest.mark.parametrize("transformation", TRANSFORMATIONS_TO_CHECK_PY)
def test_separate_consumers(kafka_producer, kafka_topics, connection, transformation):
    """Create one stream per topic, start them together, send SIMPLE_MSG to each topic and run the vertex check."""
    assert len(kafka_topics) > 0
    cursor = connection.cursor()

    # Stream names follow "stream_<transformation suffix>_<topic>".
    transformation_suffix = transformation.split(".")[1]
    stream_names = []
    for kafka_topic in kafka_topics:
        stream_names.append(f"stream_{transformation_suffix}_{kafka_topic}")

    for name, kafka_topic in zip(stream_names, kafka_topics):
        common.create_stream(cursor, name, kafka_topic, transformation)

    common.start_streams(cursor, stream_names)

    for kafka_topic in kafka_topics:
        pending_send = kafka_producer.send(kafka_topic, common.SIMPLE_MSG)
        pending_send.get(timeout=KAFKA_PRODUCER_SENDING_MSG_DEFAULT_TIMEOUT)

    for kafka_topic in kafka_topics:
        common.kafka_check_vertex_exists_with_topic_and_payload(cursor, kafka_topic, common.SIMPLE_MSG)
|
2021-11-15 23:23:49 +08:00
|
|
|
|
|
|
|
|
2022-06-09 05:17:44 +08:00
|
|
|
def test_start_from_last_committed_offset(kafka_producer, kafka_topics, connection):
    """Drop and recreate a stream, checking that messages sent in between are consumed only after the restart."""
    # The stream first consumes one message so that an offset gets committed,
    # and is then stopped and dropped. More messages are produced while no
    # stream exists; afterwards the stream is recreated and started again.
    # This imitates Memgraph being stopped (stream destroyed) and restarted
    # (stream recreated). A real restart would be a better test, but
    # restarting Memgraph within a single workload is not possible currently.
    assert len(kafka_topics) > 0
    cursor = connection.cursor()

    stream_name = "test_start_from_last_committed_offset"
    first_topic = kafka_topics[0]
    send_timeout = KAFKA_PRODUCER_SENDING_MSG_DEFAULT_TIMEOUT

    common.create_stream(cursor, stream_name, first_topic, "kafka_transform.simple")
    common.start_stream(cursor, stream_name)

    kafka_producer.send(first_topic, common.SIMPLE_MSG).get(timeout=send_timeout)
    common.kafka_check_vertex_exists_with_topic_and_payload(cursor, first_topic, common.SIMPLE_MSG)

    common.stop_stream(cursor, stream_name)
    common.drop_stream(cursor, stream_name)

    messages = [b"second message", b"third message"]
    for raw_message in messages:
        kafka_producer.send(first_topic, raw_message).get(timeout=send_timeout)

    # While the stream does not exist, none of the new payloads may show up as vertices.
    for raw_message in messages:
        payload = raw_message.decode("utf-8")
        query = f"MATCH (n: MESSAGE {{payload: '{payload}'}}) RETURN n"
        vertices_with_msg = common.execute_and_fetch_all(cursor, query)
        assert len(vertices_with_msg) == 0

    common.create_stream(cursor, stream_name, first_topic, "kafka_transform.simple")
    common.start_stream(cursor, stream_name)

    for raw_message in messages:
        common.kafka_check_vertex_exists_with_topic_and_payload(cursor, first_topic, raw_message)
|
2021-11-15 23:23:49 +08:00
|
|
|
|
|
|
|
|
2022-04-29 02:28:44 +08:00
|
|
|
@pytest.mark.parametrize("transformation", TRANSFORMATIONS_TO_CHECK_PY)
def test_check_stream(kafka_producer, kafka_topics, connection, transformation):
    """Run CHECK STREAM with batch limits 1..3 on a stopped stream, then start it and check the vertices.

    For "kafka_transform.simple" the payload is expected inline in the query
    text with no parameters; for any other transformation the query is expected
    to reference $payload / $topic and carry the values as parameters.
    """
    assert len(kafka_topics) > 0
    BATCH_SIZE = 1
    INDEX_OF_FIRST_BATCH = 0
    stream_name = "test_check_stream_" + transformation.split(".")[1]

    cursor = connection.cursor()

    common.create_stream(cursor, stream_name, kafka_topics[0], transformation, batch_size=BATCH_SIZE)
    common.start_stream(cursor, stream_name)
    kafka_producer.send(kafka_topics[0], common.SIMPLE_MSG).get(timeout=KAFKA_PRODUCER_SENDING_MSG_DEFAULT_TIMEOUT)
    common.stop_stream(cursor, stream_name)

    messages = [b"first message", b"second message", b"third message"]
    for message in messages:
        kafka_producer.send(kafka_topics[0], message).get(timeout=KAFKA_PRODUCER_SENDING_MSG_DEFAULT_TIMEOUT)

    def check_check_stream(batch_limit):
        """Run CHECK STREAM with `batch_limit` and compare the i-th result row with the i-th message."""
        test_results = common.execute_and_fetch_all(cursor, f"CHECK STREAM {stream_name} BATCH_LIMIT {batch_limit}")
        assert len(test_results) == batch_limit

        # The length assertion above makes the zip cover exactly `batch_limit` rows
        # (batch_limit never exceeds len(messages) in this test).
        for message, result in zip(messages, test_results):
            message_as_str = message.decode("utf-8")
            # If batch size != 1, then the usage of INDEX_OF_FIRST_BATCH must change: the result will have a
            # list of queries (pair<parameters,query>)
            first_query = result[common.QUERIES][INDEX_OF_FIRST_BATCH]
            query_text = first_query[common.QUERY_LITERAL]
            parameters = first_query[common.PARAMETERS_LITERAL]

            if transformation == "kafka_transform.simple":
                assert f"payload: '{message_as_str}'" in query_text
                assert parameters is None
            else:
                # Separate asserts so that a failure pinpoints which placeholder is missing.
                assert "payload: $payload" in query_text
                assert "topic: $topic" in query_text
                # This is not a very sophisticated test, but it checks that
                # the timestamp has some kind of value.
                assert parameters["timestamp"] > 1000000000000
                assert parameters["topic"] == kafka_topics[0]
                assert parameters["payload"] == message_as_str

    for batch_limit in (1, 2, 3):
        check_check_stream(batch_limit)

    common.start_stream(cursor, stream_name)

    for message in messages:
        common.kafka_check_vertex_exists_with_topic_and_payload(cursor, kafka_topics[0], message)
|
2021-11-15 23:23:49 +08:00
|
|
|
|
|
|
|
|
2023-12-21 03:03:06 +08:00
|
|
|
def test_show_streams(kafka_topics, connection):
    """Create one stream with default options and one with explicit options, then check what is reported."""
    assert len(kafka_topics) > 1
    cursor = connection.cursor()

    consumer_group = "my_special_consumer_group"
    batch_interval = 42
    batch_size = 3
    default_values_stream = "default_values"
    complex_values_stream = "complex_values"

    common.create_stream(
        cursor,
        default_values_stream,
        kafka_topics[0],
        "kafka_transform.simple",
        bootstrap_servers="'localhost:29092'",
    )
    common.create_stream(
        cursor,
        complex_values_stream,
        ",".join(kafka_topics),
        "kafka_transform.with_parameters",
        consumer_group=consumer_group,
        batch_interval=batch_interval,
        batch_size=batch_size,
    )

    shown_streams = common.execute_and_fetch_all(cursor, "SHOW STREAMS")
    assert len(shown_streams) == 2

    # 100 and 1000 occupy the same slots that hold batch_interval and batch_size
    # in the expectation for the second stream below.
    expected_default_info = (default_values_stream, "kafka", 100, 1000, "kafka_transform.simple", None, False)
    common.check_stream_info(cursor, default_values_stream, expected_default_info)

    expected_complex_info = (
        complex_values_stream,
        "kafka",
        batch_interval,
        batch_size,
        "kafka_transform.with_parameters",
        None,
        False,
    )
    common.check_stream_info(cursor, complex_values_stream, expected_complex_info)
|
|
|
|
|
|
|
|
|
|
|
|
@pytest.mark.parametrize("operation", ["START", "STOP"])
def test_start_and_stop_during_check(kafka_producer, kafka_topics, connection, operation):
    """Delegate to common.test_start_and_stop_during_check with Kafka-specific callbacks."""
    assert len(kafka_topics) > 1
    batch_size = 1
    first_topic = kafka_topics[0]

    def stream_creator(stream_name):
        # Builds the CREATE query for a stream over the first topic.
        return (
            f"CREATE KAFKA STREAM {stream_name} TOPICS {first_topic} "
            f"TRANSFORM kafka_transform.simple BATCH_SIZE {batch_size}"
        )

    def message_sender(msg):
        # Sends one message to the first topic and waits on the send result.
        pending_send = kafka_producer.send(first_topic, msg)
        pending_send.get(timeout=KAFKA_PRODUCER_SENDING_MSG_DEFAULT_TIMEOUT)

    already_stopped_message = "Kafka consumer test_stream is already stopped"
    common.test_start_and_stop_during_check(
        operation,
        connection,
        stream_creator,
        message_sender,
        already_stopped_message,
        batch_size,
    )
|
2021-11-15 23:23:49 +08:00
|
|
|
|
|
|
|
|
|
|
|
def test_check_already_started_stream(kafka_topics, connection):
    """Expect CHECK STREAM on a stream that has been started to raise mgclient.DatabaseError."""
    assert len(kafka_topics) > 0
    cursor = connection.cursor()

    stream_name = "test_check_already_started_stream"
    common.create_stream(cursor, stream_name, kafka_topics[0], "kafka_transform.simple")
    common.start_stream(cursor, stream_name)

    check_query = f"CHECK STREAM {stream_name}"
    with pytest.raises(mgclient.DatabaseError):
        common.execute_and_fetch_all(cursor, check_query)
|
2021-11-15 23:23:49 +08:00
|
|
|
|
|
|
|
|
|
|
|
def test_start_checked_stream_after_timeout(kafka_topics, connection):
    """Delegate to common.test_start_checked_stream_after_timeout with a Kafka stream factory."""

    def stream_creator(stream_name):
        # The topic is looked up at call time, exactly when the shared test asks for the query.
        topic = kafka_topics[0]
        return f"CREATE KAFKA STREAM {stream_name} TOPICS {topic} TRANSFORM kafka_transform.simple"

    common.test_start_checked_stream_after_timeout(connection, stream_creator)
|
|
|
|
|
|
|
|
|
|
|
|
def test_restart_after_error(kafka_producer, kafka_topics, connection):
    """Check that a stream which stopped running after a message can be started again and consume.

    The stream uses "kafka_transform.query". After SIMPLE_MSG is sent the test
    waits until the stream is reported as not running (presumably because the
    payload is not a valid query -- confirm against the transformation), then
    restarts the stream, sends a CREATE query as payload and expects the
    matching vertex to appear.
    """
    # Same precondition as the other tests in this file: the first topic is used below.
    assert len(kafka_topics) > 0
    cursor = connection.cursor()
    stream_name = "test_restart_after_error"
    common.create_stream(cursor, stream_name, kafka_topics[0], "kafka_transform.query")
    common.start_stream(cursor, stream_name)

    kafka_producer.send(kafka_topics[0], common.SIMPLE_MSG).get(timeout=KAFKA_PRODUCER_SENDING_MSG_DEFAULT_TIMEOUT)
    assert common.timed_wait(lambda: not common.get_is_running(cursor, stream_name))

    common.start_stream(cursor, stream_name)
    # Wait on the send like every other producer call in this file, so a delivery
    # failure surfaces here instead of as a confusing failure of the check below.
    kafka_producer.send(kafka_topics[0], b"CREATE (n:VERTEX { id : 42 })").get(
        timeout=KAFKA_PRODUCER_SENDING_MSG_DEFAULT_TIMEOUT
    )
    assert common.check_one_result_row(cursor, "MATCH (n:VERTEX { id : 42 }) RETURN n")
|
2021-11-15 23:23:49 +08:00
|
|
|
|
|
|
|
|
2022-04-29 02:28:44 +08:00
|
|
|
@pytest.mark.parametrize("transformation", TRANSFORMATIONS_TO_CHECK_PY)
def test_bootstrap_server(kafka_producer, kafka_topics, connection, transformation):
    """Create a stream with an explicit bootstrap server, send SIMPLE_MSG to each topic and run the vertex check."""
    assert len(kafka_topics) > 0
    cursor = connection.cursor()

    # The inner quotes are part of the value handed to create_stream.
    local = "'localhost:29092'"
    transformation_suffix = transformation.split(".")[1]
    stream_name = f"test_bootstrap_server_{transformation_suffix}"

    all_topics = ",".join(kafka_topics)
    common.create_stream(cursor, stream_name, all_topics, transformation, bootstrap_servers=local)
    common.start_stream(cursor, stream_name)

    for kafka_topic in kafka_topics:
        pending_send = kafka_producer.send(kafka_topic, common.SIMPLE_MSG)
        pending_send.get(timeout=KAFKA_PRODUCER_SENDING_MSG_DEFAULT_TIMEOUT)

    for kafka_topic in kafka_topics:
        common.kafka_check_vertex_exists_with_topic_and_payload(cursor, kafka_topic, common.SIMPLE_MSG)
|
2021-11-15 23:23:49 +08:00
|
|
|
|
|
|
|
|
2022-04-29 02:28:44 +08:00
|
|
|
@pytest.mark.parametrize("transformation", TRANSFORMATIONS_TO_CHECK_PY)
def test_bootstrap_server_empty(kafka_topics, connection, transformation):
    """Expect creating a stream with an empty BOOTSTRAP_SERVERS value to raise mgclient.DatabaseError."""
    assert len(kafka_topics) > 0
    cursor = connection.cursor()

    all_topics = ",".join(kafka_topics)
    create_query = f"CREATE KAFKA STREAM test TOPICS {all_topics} TRANSFORM {transformation} BOOTSTRAP_SERVERS ''"
    with pytest.raises(mgclient.DatabaseError):
        common.execute_and_fetch_all(cursor, create_query)
|
|
|
|
|
|
|
|
|
2022-04-29 02:28:44 +08:00
|
|
|
@pytest.mark.parametrize("transformation", TRANSFORMATIONS_TO_CHECK_PY)
def test_set_offset(kafka_producer, kafka_topics, connection, transformation):
    """Exercise mg.kafka_set_stream_offset with the arguments 10, -1 and -2 and check what gets consumed.

    Twenty messages are sent before the stream is ever started. With 10 the
    last ten payloads are expected, with -1 all twenty, and with -2 nothing
    until a new message is sent.
    """
    assert len(kafka_topics) > 0
    cursor = connection.cursor()
    stream_name = "test"
    common.execute_and_fetch_all(
        cursor,
        f"CREATE KAFKA STREAM {stream_name} TOPICS {kafka_topics[0]} TRANSFORM {transformation} BATCH_SIZE 1",
    )

    messages = [f"{i} message" for i in range(1, 21)]
    for message in messages:
        kafka_producer.send(kafka_topics[0], message.encode()).get(timeout=KAFKA_PRODUCER_SENDING_MSG_DEFAULT_TIMEOUT)

    def consume(expected_msgs):
        """Start the stream, wait for the last expected payload (or 2 s if none), stop it, return all payloads."""
        common.start_stream(cursor, stream_name)
        if not expected_msgs:
            # Nothing to wait for: give the stream a moment in which it could (wrongly) consume something.
            time.sleep(2)
        else:
            # NOTE: there is no space between ")" and "RETURN"; the query text is kept exactly as it was.
            assert common.check_one_result_row(
                cursor,
                f"MATCH (n: MESSAGE {{payload: '{expected_msgs[-1]}'}})RETURN n",
            )
        common.stop_stream(cursor, stream_name)
        return common.execute_and_fetch_all(cursor, "MATCH (n) RETURN n.payload")

    def execute_set_offset_and_consume(offset, expected_msgs):
        """Set the stream offset via the procedure, then consume as in `consume`."""
        common.execute_and_fetch_all(cursor, f"CALL mg.kafka_set_stream_offset('{stream_name}', {offset})")
        return consume(expected_msgs)

    def comparison_check(a, b):
        """Compare `a` with the text of result row `b` after stripping quote, paren and comma characters."""
        return a == str(b).strip("'(,)")

    # Setting the offset of a stream name that was never created must fail.
    with pytest.raises(mgclient.DatabaseError):
        common.execute_and_fetch_all(cursor, "CALL mg.kafka_set_stream_offset('foo', 10)")

    last_ten = messages[10:]
    res = execute_set_offset_and_consume(10, last_ten)
    assert len(res) == 10
    assert all(comparison_check(a, b) for a, b in zip(last_ten, res))
    common.execute_and_fetch_all(cursor, "MATCH (n) DETACH DELETE n")

    res = execute_set_offset_and_consume(-1, messages)
    assert len(res) == len(messages)
    assert all(comparison_check(a, b) for a, b in zip(messages, res))
    res = common.execute_and_fetch_all(cursor, "MATCH (n) return n.offset")
    # NOTE(review): index 0 is not checked; looks unintentional -- confirm before widening the range.
    assert all(comparison_check(str(i), res[i]) for i in range(1, 20))
    common.execute_and_fetch_all(cursor, "MATCH (n) DETACH DELETE n")

    res = execute_set_offset_and_consume(-2, [])
    assert len(res) == 0
    last_msg = "Final Message"
    kafka_producer.send(kafka_topics[0], last_msg.encode()).get(timeout=KAFKA_PRODUCER_SENDING_MSG_DEFAULT_TIMEOUT)
    res = consume([last_msg])
    assert len(res) == 1
    assert comparison_check("Final Message", res[0])
    common.execute_and_fetch_all(cursor, "MATCH (n) DETACH DELETE n")
|
|
|
|
|
2022-02-01 00:26:53 +08:00
|
|
|
|
2021-11-29 15:56:10 +08:00
|
|
|
def test_info_procedure(kafka_topics, connection):
    """Create a fully configured stream and validate the row returned by mg.kafka_stream_info."""
    cursor = connection.cursor()

    stream_name = "test_stream"
    local = "localhost:29092"
    consumer_group = "ConsumerGr"
    configs = {"sasl.username": "michael.scott"}
    credentials = {"sasl.password": "S3cr3tP4ssw0rd"}

    common.create_stream(
        cursor,
        stream_name,
        ",".join(kafka_topics),
        "kafka_transform.simple",
        consumer_group=consumer_group,
        bootstrap_servers=f"'{local}'",
        configs=configs,
        credentials=credentials,
    )

    info_query = f"CALL mg.kafka_stream_info('{stream_name}') YIELD *"
    stream_info = common.execute_and_fetch_all(cursor, info_query)

    # Every credential key is expected back with this placeholder instead of its value.
    # The spelling of the literal is intentional here: it is compared against the query result.
    masked_credentials = dict.fromkeys(credentials, "<REDUCTED>")

    expected_row = (local, configs, consumer_group, masked_credentials, kafka_topics)
    common.validate_info(stream_info, [expected_row])
|
|
|
|
|
2022-06-09 05:17:44 +08:00
|
|
|
|
|
|
|
@pytest.mark.parametrize("transformation", TRANSFORMATIONS_TO_CHECK_C)
def test_load_c_transformations(connection, transformation):
    """Check that mg.transformations() lists exactly one name starting with `transformation`, equal to it."""
    cursor = connection.cursor()

    query = (
        "CALL mg.transformations() YIELD * "
        f"WITH name WHERE name STARTS WITH '{transformation}' "
        "RETURN name"
    )
    rows = common.execute_and_fetch_all(cursor, query)

    assert len(rows) == 1
    first_row = rows[0]
    assert first_row[0] == transformation
|
2022-06-09 05:17:44 +08:00
|
|
|
|
|
|
|
|
|
|
|
def test_check_stream_same_number_of_queries_than_messages(kafka_producer, kafka_topics, connection):
    """Delegate to the shared test in `common`, using the "check_stream_no_filtering" transformation."""
    assert len(kafka_topics) > 0

    transformation_name = "common_transform.check_stream_no_filtering"
    first_topic = kafka_topics[0]

    def stream_creator(stream_name, batch_size):
        # Builds the CREATE query for a stream over the first topic with the given batch size.
        return (
            f"CREATE KAFKA STREAM {stream_name} TOPICS {first_topic} "
            f"TRANSFORM {transformation_name} BATCH_INTERVAL 3000 BATCH_SIZE {batch_size}"
        )

    def message_sender(msg):
        # Sends one message to the first topic and waits on the send result.
        pending_send = kafka_producer.send(first_topic, msg)
        pending_send.get(timeout=KAFKA_PRODUCER_SENDING_MSG_DEFAULT_TIMEOUT)

    common.test_check_stream_same_number_of_queries_than_messages(connection, stream_creator, message_sender)
|
|
|
|
|
|
|
|
|
|
|
|
def test_check_stream_different_number_of_queries_than_messages(kafka_producer, kafka_topics, connection):
    """Delegate to the shared test in `common`, using the "check_stream_with_filtering" transformation."""
    assert len(kafka_topics) > 0

    transformation_name = "common_transform.check_stream_with_filtering"
    first_topic = kafka_topics[0]

    def stream_creator(stream_name, batch_size):
        # Builds the CREATE query for a stream over the first topic with the given batch size.
        return (
            f"CREATE KAFKA STREAM {stream_name} TOPICS {first_topic} "
            f"TRANSFORM {transformation_name} BATCH_INTERVAL 3000 BATCH_SIZE {batch_size}"
        )

    def message_sender(msg):
        # Sends one message to the first topic and waits on the send result.
        pending_send = kafka_producer.send(first_topic, msg)
        pending_send.get(timeout=KAFKA_PRODUCER_SENDING_MSG_DEFAULT_TIMEOUT)

    common.test_check_stream_different_number_of_queries_than_messages(connection, stream_creator, message_sender)
|
|
|
|
|
|
|
|
|
2022-06-20 20:09:45 +08:00
|
|
|
def test_start_stream_with_batch_limit(kafka_producer, kafka_topics, connection):
    """Delegate to common.test_start_stream_with_batch_limit with a fixed stream name and Kafka callbacks."""
    assert len(kafka_topics) > 0
    stream_name = "test_start_stream_with_batch_limit"
    first_topic = kafka_topics[0]

    def stream_creator():
        # Takes no arguments: the stream name is fixed by this test.
        return (
            f"CREATE KAFKA STREAM {stream_name} TOPICS {first_topic} "
            "TRANSFORM kafka_transform.simple BATCH_SIZE 1"
        )

    def messages_sender(nof_messages):
        # Sends SIMPLE_MSG `nof_messages` times, waiting on each send before the next one.
        sent = 0
        while sent < nof_messages:
            pending_send = kafka_producer.send(first_topic, common.SIMPLE_MSG)
            pending_send.get(timeout=KAFKA_PRODUCER_SENDING_MSG_DEFAULT_TIMEOUT)
            sent += 1

    common.test_start_stream_with_batch_limit(connection, stream_name, stream_creator, messages_sender)
|
2022-06-20 20:09:45 +08:00
|
|
|
|
|
|
|
|
2023-12-21 03:03:06 +08:00
|
|
|
def test_start_stream_with_batch_limit_timeout(kafka_topics, connection):
    """Delegate to common.test_start_stream_with_batch_limit_timeout with a Kafka stream factory."""
    assert len(kafka_topics) > 0
    first_topic = kafka_topics[0]

    def stream_creator(stream_name):
        # Builds the CREATE query for a stream over the first topic with BATCH_SIZE 1.
        query_parts = (
            f"CREATE KAFKA STREAM {stream_name}",
            f"TOPICS {first_topic}",
            "TRANSFORM kafka_transform.simple",
            "BATCH_SIZE 1",
        )
        return " ".join(query_parts)

    common.test_start_stream_with_batch_limit_timeout(connection, stream_creator)
|
|
|
|
|
|
|
|
|
2023-12-21 03:03:06 +08:00
|
|
|
def test_start_stream_with_batch_limit_reaching_timeout(kafka_topics, connection):
    """Delegate to common.test_start_stream_with_batch_limit_reaching_timeout with a Kafka stream factory."""
    assert len(kafka_topics) > 0
    first_topic = kafka_topics[0]

    def stream_creator(stream_name, batch_size):
        # Builds the CREATE query for a stream over the first topic with the given batch size.
        return (
            f"CREATE KAFKA STREAM {stream_name} TOPICS {first_topic} "
            f"TRANSFORM kafka_transform.simple BATCH_SIZE {batch_size}"
        )

    common.test_start_stream_with_batch_limit_reaching_timeout(connection, stream_creator)
|
|
|
|
|
|
|
|
|
|
|
|
def test_start_stream_with_batch_limit_while_check_running(kafka_producer, kafka_topics, connection):
    """Delegate to the shared test in `common`, supplying Kafka callbacks and a process-based setup step."""
    assert len(kafka_topics) > 0
    first_topic = kafka_topics[0]

    def stream_creator(stream_name):
        # Builds the CREATE query for a stream over the first topic with BATCH_SIZE 1.
        return (
            f"CREATE KAFKA STREAM {stream_name} TOPICS {first_topic} "
            "TRANSFORM kafka_transform.simple BATCH_SIZE 1"
        )

    def message_sender(message):
        # Sends one message to the first topic and waits on the send result.
        pending_send = kafka_producer.send(first_topic, message)
        pending_send.get(timeout=KAFKA_PRODUCER_SENDING_MSG_DEFAULT_TIMEOUT)

    def setup_function(start_check_stream, cursor, stream_name, batch_limit, timeout):
        # Run `start_check_stream` in a separate daemon process so this process can keep going.
        check_process = Process(
            target=start_check_stream,
            args=(stream_name, batch_limit, timeout),
            daemon=True,
        )
        check_process.start()

        # Do not send anything until the stream is reported as running.
        assert mg_sleep_and_assert(True, lambda: common.get_is_running(cursor, stream_name))

        message_sender(common.SIMPLE_MSG)
        check_process.join()

    common.test_start_stream_with_batch_limit_while_check_running(
        connection,
        stream_creator,
        message_sender,
        setup_function,
    )
|
|
|
|
|
|
|
|
|
|
|
|
def test_check_while_stream_with_batch_limit_running(kafka_producer, kafka_topics, connection):
    """Delegate to common.test_check_while_stream_with_batch_limit_running with Kafka callbacks."""
    assert len(kafka_topics) > 0
    first_topic = kafka_topics[0]

    def stream_creator(stream_name):
        # Builds the CREATE query for a stream over the first topic with BATCH_SIZE 1.
        return (
            f"CREATE KAFKA STREAM {stream_name} TOPICS {first_topic} "
            "TRANSFORM kafka_transform.simple BATCH_SIZE 1"
        )

    def message_sender(message):
        # Sends one message to the first topic and waits on the send result.
        pending_send = kafka_producer.send(first_topic, message)
        pending_send.get(timeout=KAFKA_PRODUCER_SENDING_MSG_DEFAULT_TIMEOUT)

    common.test_check_while_stream_with_batch_limit_running(connection, stream_creator, message_sender)
|
|
|
|
|
|
|
|
|
2023-12-21 03:03:06 +08:00
|
|
|
def test_start_stream_with_batch_limit_with_invalid_batch_limit(kafka_topics, connection):
    """Delegate to common.test_start_stream_with_batch_limit_with_invalid_batch_limit with a Kafka stream factory."""
    assert len(kafka_topics) > 0
    first_topic = kafka_topics[0]

    def stream_creator(stream_name):
        # Builds the CREATE query for a stream over the first topic with BATCH_SIZE 1.
        return (
            f"CREATE KAFKA STREAM {stream_name} TOPICS {first_topic} "
            "TRANSFORM kafka_transform.simple BATCH_SIZE 1"
        )

    common.test_start_stream_with_batch_limit_with_invalid_batch_limit(connection, stream_creator)
|
|
|
|
|
|
|
|
|
2023-12-21 03:03:06 +08:00
|
|
|
def test_check_stream_with_batch_limit_with_invalid_batch_limit(kafka_topics, connection):
    """Delegate to common.test_check_stream_with_batch_limit_with_invalid_batch_limit with a Kafka stream factory."""
    assert len(kafka_topics) > 0
    first_topic = kafka_topics[0]

    def stream_creator(stream_name):
        # Builds the CREATE query for a stream over the first topic with BATCH_SIZE 1.
        return (
            f"CREATE KAFKA STREAM {stream_name} TOPICS {first_topic} "
            "TRANSFORM kafka_transform.simple BATCH_SIZE 1"
        )

    common.test_check_stream_with_batch_limit_with_invalid_batch_limit(connection, stream_creator)
|
|
|
|
|
|
|
|
|
2021-11-15 23:23:49 +08:00
|
|
|
if __name__ == "__main__":
    # When executed as a script, run pytest on this file and use its return value as the exit status.
    pytest_arguments = [__file__, "-rA"]
    sys.exit(pytest.main(pytest_arguments))
|