From fe9c56da9189b2d57dc1e365448b40b1410bb227 Mon Sep 17 00:00:00 2001
From: Pavel Tisnovsky <ptisnovs@redhat.com>
Date: Mon, 16 Feb 2026 11:11:07 +0100
Subject: [PATCH 1/2] Refactored existing benchmarks

---
 tests/benchmarks/conftest.py          | 120 +++++
 tests/benchmarks/data_generators.py   | 159 +++++++
 tests/benchmarks/db_benchmarks.py     | 334 ++++++++++++++
 tests/benchmarks/test_app_database.py | 605 +-------------------------
 4 files changed, 621 insertions(+), 597 deletions(-)
 create mode 100644 tests/benchmarks/conftest.py
 create mode 100644 tests/benchmarks/data_generators.py
 create mode 100644 tests/benchmarks/db_benchmarks.py

diff --git a/tests/benchmarks/conftest.py b/tests/benchmarks/conftest.py
new file mode 100644
index 000000000..82a40b67d
--- /dev/null
+++ b/tests/benchmarks/conftest.py
@@ -0,0 +1,120 @@
+"""Fixtures used by benchmarks."""
+
+from pathlib import Path
+import pytest
+
+import psycopg2
+
+from app import database
+from configuration import configuration, AppConfig
+
+
+@pytest.fixture(name="configuration_filename_sqlite")
+def configuration_filename_sqlite_fixture() -> str:
+    """Retrieve configuration file name to be used by benchmarks.
+
+    Parameters:
+        None
+
+    Returns:
+        str: Path to the benchmark configuration file to load.
+    """
+    return "tests/configuration/benchmarks-sqlite.yaml"
+
+
+@pytest.fixture(name="configuration_filename_postgres")
+def configuration_filename_postgres_fixture() -> str:
+    """Retrieve configuration file name to be used by benchmarks.
+
+    Parameters:
+        None
+
+    Returns:
+        str: Path to the benchmark configuration file to load.
+    """
+    return "tests/configuration/benchmarks-postgres.yaml"
+
+
+@pytest.fixture(name="sqlite_database")
+def sqlite_database_fixture(configuration_filename_sqlite: str, tmp_path: Path) -> None:
+    """Initialize a temporary SQLite database for benchmarking.
+
+    This fixture:
+    - Loads the provided configuration file.
+    - Ensures an SQLite configuration is present.
+    - Uses a temp path for the SQLite DB file to guarantee a fresh DB for each run.
+    - Initializes the DB engine and creates required tables.
+
+    Parameters:
+        configuration_filename_sqlite (str): Path to the YAML configuration file to load.
+        tmp_path (Path): pytest-provided temporary directory for creating the DB file.
+
+    Raises:
+        AssertionError: If the configuration does not include an sqlite configuration.
+    """
+    # try to load the configuration containing SQLite database setup
+    configuration.load_configuration(configuration_filename_sqlite)
+    assert configuration.database_configuration.sqlite is not None
+
+    # we need to start each benchmark with empty database
+    configuration.database_configuration.sqlite.db_path = str(tmp_path / "database.db")
+
+    # initialize database session and create tables
+    database.initialize_database()
+    database.create_tables()
+
+
+def drop_postgres_tables(configuration: AppConfig) -> None:
+    """Drop postgres tables used by benchmarks.
+
+    The tables will be re-created so every benchmark start with fresh DB.
+    """
+
+    pgconfig = configuration.database_configuration.postgres
+    assert pgconfig is not None
+
+    # try to connect to Postgres
+    conn = psycopg2.connect(
+        database=pgconfig.db,
+        user=pgconfig.user,
+        password=pgconfig.password.get_secret_value(),
+        host=pgconfig.host,
+        port=pgconfig.port,
+    )
+
+    # try to drop tables used by benchmarks
+    try:
+        with conn.cursor() as cursor:
+            cursor.execute("DROP TABLE IF EXISTS user_turn;")
+            cursor.execute("DROP TABLE IF EXISTS user_conversation;")
+        conn.commit()
+    finally:
+        # closing the connection
+        conn.close()
+
+
+@pytest.fixture(name="postgres_database")
+def postgres_database_fixture(configuration_filename_postgres: str) -> None:
+    """Initialize a temporary postgres database for benchmarking.
+
+    This fixture:
+    - Loads the provided configuration file.
+    - Ensures an Postgres configuration is present.
+    - Initializes the DB engine and creates required tables.
+
+    Parameters:
+        configuration_filename_postgres (str): Path to the YAML configuration file to load.
+
+    Raises:
+        AssertionError: If the configuration does not include an postgres configuration.
+    """
+    # try to load the configuration containing postgres database setup
+    configuration.load_configuration(configuration_filename_postgres)
+    assert configuration.database_configuration.postgres is not None
+
+    # make sure all tables will be re-initialized
+    drop_postgres_tables(configuration)
+
+    # initialize database session and create tables
+    database.initialize_database()
+    database.create_tables()
diff --git a/tests/benchmarks/data_generators.py b/tests/benchmarks/data_generators.py
new file mode 100644
index 000000000..e39f1d6e7
--- /dev/null
+++ b/tests/benchmarks/data_generators.py
@@ -0,0 +1,159 @@
+"""Data generators used by benchmarks."""
+
+import random
+
+
+def generate_provider() -> str:
+    """Return a randomly chosen provider name.
+
+    The provider is selected from a predefined list of possible providers to
+    simulate different user conversation during benchmarks.
+
+    Returns:
+        str: Selected provider name.
+    """
+    providers = [
+        "openai",
+        "azure",
+        "vertexAI",
+        "watsonx",
+        "RHOAI (vLLM)",
+        "RHAIIS (vLLM)",
+        "RHEL AI (vLLM)",
+    ]
+    return random.choice(providers)
+
+
+def generate_model_for_provider(provider: str) -> str:
+    """Return a randomly chosen model ID for a given provider.
+
+    Parameters:
+        provider (str): Name of the provider for which to pick a model.
+
+    Returns:
+        str: A model identifier associated with the given provider. If the
+            provider is unknown, a fallback value of "foo" is returned.
+    """
+    models: dict[str, list[str]] = {
+        "openai": [
+            "gpt-5",
+            "gpt-5.2",
+            "gpt-5.2 pro",
+            "gpt-5 mini",
+            "gpt-4.1",
+            "gpt-4o",
+            "gpt-4-turbo",
+            "gpt-4.1 mini",
+            "gpt-4.1 nano",
+            "o4-mini",
+            "o1",
+            "o3",
+            "o4",
+        ],
+        "azure": [
+            "gpt-5",
+            "gpt-5-mini",
+            "gpt-5-nano",
+            "gpt-4.1",
+            "gpt-4.1 mini",
+            "gpt-5-chat",
+            "gpt-5.1",
+            "gpt-5.1-codex",
+            "gpt-5.2",
+            "gpt-5.2-chat",
+            "gpt-5.2-codex",
+            "claude-opus-4-5",
+            "claude-haiku-4-5",
+            "claude-sonnet-4-5",
+            "DeepSeek-v3.1",
+        ],
+        "vertexAI": [
+            "google/gemini-2.0-flash",
+            "google/gemini-2.5-flash",
+            "google/gemini-2.5-pro",
+        ],
+        "watsonx": [
+            "all-mini-l6-v2",
+            "multilingual-e5-large",
+            "granite-embedding-107m-multilingual",
+            "ibm-granite/granite-4.0-micro",
+            "ibm-granite/granite-4.0-micro-base",
+            "ibm-granite/granite-4.0-h-micro",
+            "ibm-granite/granite-4.0-h-micro-base",
+            "ibm-granite/granite-4.0-h-tiny",
+            "ibm-granite/granite-4.0-h-tiny-base",
+            "ibm-granite/granite-4.0-h-small",
+            "ibm-granite/granite-4.0-h-small-base",
+            "ibm-granite/granite-4.0-tiny-preview",
+            "ibm-granite/granite-4.0-tiny-base-preview",
+        ],
+        "RHOAI (vLLM)": ["meta-llama/Llama-3.2-1B-Instruct"],
+        "RHAIIS (vLLM)": ["meta-llama/Llama-3.1-8B-Instruct"],
+        "RHEL AI (vLLM)": ["meta-llama/Llama-3.1-8B-Instruct"],
+    }
+    return random.choice(models.get(provider, ["foo"]))
+
+
+def generate_topic_summary() -> str:
+    """Return a randomized topic summary string.
+
+    The summary is constructed by selecting one phrase from each of several
+    phrase groups to create varied but deterministic-looking summaries for the
+    test data.
+
+    Returns:
+        str: Generated summary sentence ending with a period.
+    """
+    yaps = [
+        [
+            "Soudruzi,",
+            "Na druhe strane",
+            "Stejne tak",
+            "Nesmime vsak zapominat, ze",
+            "Timto zpusobem",
+            "Zavaznost techto problemu je natolik zrejma, ze",
+            "Kazdodenni praxe nam potvrzuje, ze",
+            "Pestre a bohate zkusenosti",
+            "Poslani organizace, zejmena pak",
+            "Ideove uvahy nejvyssiho radu a rovnez",
+        ],
+        [
+            "realizace planovanych vytycenych ukolu",
+            "ramec a mista vychovy kadru",
+            "stabilni a kvantitativni vzrust a sfera nasi aktivity",
+            "vytvorena struktura organizace",
+            "novy model organizacni cinnosti",
+            "stale, informacne-propagandisticke zabezpeceni nasi prace",
+            "dalsi rozvoj ruznych forem cinnosti",
+            "upresneni a rozvoj struktur",
+            "konzultace se sirokym aktivem",
+            "pocatek kazdodenni prace na poli formovani pozice",
+        ],
+        [
+            "hraje zavaznou roli pri utvareni",
+            "vyzaduji od nas analyzy",
+            "vyzaduji nalezeni a jednoznacne upresneni",
+            "napomaha priprave a realizaci",
+            "zabezpecuje sirokemu okruhu specialistu ucast pri tvorbe",
+            "ve znacne mire podminuje vytvoreni",
+            "umoznuje splnit vyznamne ukoly na rozpracovani",
+            "umoznuje zhodnotit vyznam",
+            "predstavuje pozoruhodny experiment proverky",
+            "vyvolava proces zavadeni a modernizace",
+        ],
+        [
+            "existujicich financnich a administrativnich podminek",
+            "dalsich smeru rozvoje",
+            "systemu masove ucasti",
+            "pozic jednotlivych ucastniku k zadanym ukolum",
+            "novych navrhu",
+            "systemu vychovy kadru odpovidajicich aktualnim potrebam",
+            "smeru progresivniho rozvoje",
+            "odpovidajicich podminek aktivizace",
+            "modelu rozvoje",
+            "forem pusobeni",
+        ],
+    ]
+
+    summary = " ".join([random.choice(yap) for yap in yaps]) + "."
+    return summary
diff --git a/tests/benchmarks/db_benchmarks.py b/tests/benchmarks/db_benchmarks.py
new file mode 100644
index 000000000..b04ac91db
--- /dev/null
+++ b/tests/benchmarks/db_benchmarks.py
@@ -0,0 +1,334 @@
+"""Database benchmarks implementations."""
+
+from typing import Optional
+from sqlalchemy.orm import Session
+from datetime import UTC, datetime
+from pytest_benchmark.fixture import BenchmarkFixture
+
+from app.database import get_session
+from utils.suid import get_suid
+
+from models.database.conversations import UserConversation
+
+from .data_generators import (
+    generate_provider,
+    generate_model_for_provider,
+    generate_topic_summary,
+)
+
+
+def store_new_user_conversation(
+    session: Session, id: Optional[str] = None, user_id: Optional[str] = None
+) -> None:
+    """Store the new user conversation into database.
+
+    This helper constructs a UserConversation structure with randomized
+    provider/model and topic summary values and commits it into the provided
+    session.
+
+    Parameters:
+        session (Session): SQLAlchemy session used to persist the record.
+        id (Optional[str]): Optional explicit ID to assign to the new conversation.
+            If not provided, a generated suid will be used.
+        user_id (Optional[str]): Optional explicit user ID to assign to the new
+            conversation. If not provided, a generated suid will be used.
+
+    Returns:
+        None
+    """
+    provider = generate_provider()
+    model = generate_model_for_provider(provider)
+    topic_summary = generate_topic_summary()
+    conversation = UserConversation(
+        id=id or get_suid(),
+        user_id=user_id or get_suid(),
+        last_used_model=model,
+        last_used_provider=provider,
+        topic_summary=topic_summary,
+        last_message_at=datetime.now(UTC),
+        message_count=1,
+    )
+    session.add(conversation)
+    session.commit()
+
+
+def update_user_conversation(session: Session, id: str) -> None:
+    """Update existing conversation in the database.
+
+    This helper constructs a UserConversation structure with randomized
+    provider/model and topic summary values and commits it into the provided
+    session.
+
+    Parameters:
+        session (Session): SQLAlchemy session used to persist the record.
+        id (Optional[str]): Optional explicit ID to assign to the new conversation.
+            If not provided, a generated suid will be used.
+
+    Returns:
+        None
+    """
+    provider = generate_provider()
+    model = generate_model_for_provider(provider)
+    topic_summary = generate_topic_summary()
+
+    existing_conversation = session.query(UserConversation).filter_by(id=id).first()
+    assert existing_conversation is not None
+
+    existing_conversation.last_used_model = model
+    existing_conversation.last_used_provider = provider
+    existing_conversation.last_message_at = datetime.now(UTC)
+    existing_conversation.message_count += 1
+    existing_conversation.topic_summary = topic_summary
+    session.commit()
+
+
+def list_conversation_for_all_users(session: Session) -> None:
+    """Query and assert retrieval of all user conversations.
+
+    This helper queries all UserConversation records and asserts that the
+    result is a list (possibly empty). It is intended for use in a benchmark
+    that measures the listing performance.
+
+    Parameters:
+        session (Session): SQLAlchemy session used to query conversations.
+
+    Returns:
+        None
+    """
+    query = session.query(UserConversation)
+
+    user_conversations = query.all()
+    assert user_conversations is not None
+    assert len(user_conversations) >= 0
+
+
+def retrieve_conversation(
+    session: Session, conversation_id: str, should_be_none: bool
+) -> None:
+    """Query and assert retrieval of one conversation.
+
+    This helper function retrieves one given conversation from a database. It
+    is intended for use in a benchmark that measures the listing performance.
+
+    Parameters:
+        session (Session): SQLAlchemy session used to query conversations.
+
+    Returns:
+        None
+    """
+    query = session.query(UserConversation).filter_by(id=conversation_id)
+
+    conversation = query.first()
+    if should_be_none:
+        assert conversation is None
+    else:
+        assert conversation is not None
+
+
+def retrieve_conversation_for_one_user(
+    session: Session, user_id: str, conversation_id: str, should_be_none: bool
+) -> None:
+    """Query and assert retrieval of one conversation.
+
+    This helper function retrieves one given conversation from a database. It
+    is intended for use in a benchmark that measures the listing performance.
+
+    Parameters:
+        session (Session): SQLAlchemy session used to query conversations.
+
+    Returns:
+        None
+    """
+    query = session.query(UserConversation).filter_by(
+        id=conversation_id, user_id=user_id
+    )
+
+    conversation = query.first()
+    if should_be_none:
+        assert conversation is None
+    else:
+        assert conversation is not None
+
+
+def list_conversation_for_one_user(session: Session, user_id: str) -> None:
+    """Query and assert retrieval of one user conversation.
+
+    This helper queries all UserConversation records and asserts that the
+    result is a list (possibly empty). It is intended for use in a benchmark
+    that measures the listing performance.
+
+    Parameters:
+        session (Session): SQLAlchemy session used to query conversations.
+
+    Returns:
+        None
+    """
+    query = session.query(UserConversation).filter_by(user_id=user_id)
+
+    user_conversations = query.all()
+    assert user_conversations is not None
+    assert len(user_conversations) >= 0
+
+
+def benchmark_store_new_user_conversations(
+    benchmark: BenchmarkFixture, records_to_insert: int
+) -> None:
+    """Prepare DB and benchmark storing a single new conversation.
+
+    The database is pre-populated with ``records_to_insert`` records, then the
+    benchmark task stores one more conversation (using the helper above).
+
+    Parameters:
+        benchmark (BenchmarkFixture): pytest-benchmark fixture to run the measurement.
+        records_to_insert (int): Number of records to pre-populate before benchmarking.
+
+    Returns:
+        None
+    """
+    with get_session() as session:
+        # store bunch of conversations first
+        for id in range(records_to_insert):
+            store_new_user_conversation(session, str(id))
+        # then perform the benchmark
+        benchmark(store_new_user_conversation, session)
+
+
+def benchmark_update_user_conversation(
+    benchmark: BenchmarkFixture, records_to_insert: int
+) -> None:
+    """Prepare DB and benchmark updating a single existing conversation.
+
+    The database is pre-populated with ``records_to_insert`` records. Ensures
+    that a record with id "1234" exists (inserting it explicitly when needed)
+    and then benchmarks updating that conversation.
+
+    Parameters:
+        benchmark (BenchmarkFixture): pytest-benchmark fixture to run the measurement.
+        records_to_insert (int): Number of records to pre-populate before benchmarking.
+
+    Returns:
+        None
+    """
+    with get_session() as session:
+        # store bunch of conversations first
+        # Ensure record "1234" exists for the update benchmark.
+        # if records_to_insert <= 1234, range() won't include 1234, so insert it explicitly.
+        if records_to_insert <= 1234:
+            store_new_user_conversation(session, "1234")
+
+        # pre-populate database with records
+        for id in range(records_to_insert):
+            store_new_user_conversation(session, str(id))
+
+        # then perform the benchmark
+        benchmark(update_user_conversation, session, "1234")
+
+
+def benchmark_list_conversations_for_all_users(
+    benchmark: BenchmarkFixture, records_to_insert: int
+) -> None:
+    """Prepare DB and benchmark listing all conversations.
+
+    Pre-populates the DB with ``records_to_insert`` entries and benchmarks
+    the performance of querying and retrieving all UserConversation rows.
+
+    Parameters:
+        benchmark (BenchmarkFixture): pytest-benchmark fixture to run the measurement.
+        records_to_insert (int): Number of records to pre-populate before benchmarking.
+
+    Returns:
+        None
+    """
+    with get_session() as session:
+        # store bunch of conversations first
+        for id in range(records_to_insert):
+            store_new_user_conversation(session, str(id))
+        # then perform the benchmark
+        benchmark(list_conversation_for_all_users, session)
+
+
+def benchmark_list_conversations_for_one_user(
+    benchmark: BenchmarkFixture, records_to_insert: int
+) -> None:
+    """Prepare DB and benchmark listing all conversations.
+
+    Pre-populates the DB with ``records_to_insert`` entries and benchmarks
+    the performance of querying and retrieving all UserConversation rows.
+
+    Parameters:
+        benchmark (BenchmarkFixture): pytest-benchmark fixture to run the measurement.
+        records_to_insert (int): Number of records to pre-populate before benchmarking.
+
+    Returns:
+        None
+    """
+    with get_session() as session:
+        # store bunch of conversations first
+        for id in range(records_to_insert):
+            # use explicit conversation ID and also user ID
+            store_new_user_conversation(session, str(id), str(id))
+        # user ID somewhere in the middle of database
+        user_id = str(records_to_insert / 2)
+        # then perform the benchmark
+        benchmark(list_conversation_for_one_user, session, user_id)
+
+
+def benchmark_retrieve_conversation(
+    benchmark: BenchmarkFixture, records_to_insert: int
+) -> None:
+    """Prepare DB and benchmark retrieving one conversation.
+
+    Pre-populates the DB with ``records_to_insert`` entries and benchmarks
+    the performance of querying and retrieving one UserConversation record.
+
+    Parameters:
+        benchmark (BenchmarkFixture): pytest-benchmark fixture to run the measurement.
+        records_to_insert (int): Number of records to pre-populate before benchmarking.
+
+    Returns:
+        None
+    """
+    with get_session() as session:
+        # store bunch of conversations first
+        for id in range(records_to_insert):
+            # use explicit conversation ID and also user ID
+            store_new_user_conversation(session, str(id), str(id))
+        # user ID somewhere in the middle of database
+        conversation_id = str(records_to_insert // 2)
+        # then perform the benchmark
+        benchmark(
+            retrieve_conversation, session, conversation_id, records_to_insert == 0
+        )
+
+
+def benchmark_retrieve_conversation_for_one_user(
+    benchmark: BenchmarkFixture, records_to_insert: int
+) -> None:
+    """Prepare DB and benchmark retrieving one conversation.
+
+    Pre-populates the DB with ``records_to_insert`` entries and benchmarks
+    the performance of querying and retrieving one UserConversation record.
+
+    Parameters:
+        benchmark (BenchmarkFixture): pytest-benchmark fixture to run the measurement.
+        records_to_insert (int): Number of records to pre-populate before benchmarking.
+
+    Returns:
+        None
+    """
+    with get_session() as session:
+        # store bunch of conversations first
+        for id in range(records_to_insert):
+            # use explicit conversation ID and also user ID
+            store_new_user_conversation(session, str(id), str(id))
+        # user ID somewhere in the middle of database
+        user_id = str(records_to_insert // 2)
+        conversation_id = str(records_to_insert // 2)
+        # then perform the benchmark
+        benchmark(
+            retrieve_conversation_for_one_user,
+            session,
+            user_id,
+            conversation_id,
+            records_to_insert == 0,  # a flag whether records should be read
+        )
diff --git a/tests/benchmarks/test_app_database.py b/tests/benchmarks/test_app_database.py
index 6823d342a..4bb932ac2 100644
--- a/tests/benchmarks/test_app_database.py
+++ b/tests/benchmarks/test_app_database.py
@@ -1,20 +1,15 @@
 """Benchmarks for app.database module."""
 
-from typing import Optional
-from pathlib import Path
-import pytest
-import random
-from sqlalchemy.orm import Session
 from pytest_benchmark.fixture import BenchmarkFixture
-from datetime import UTC, datetime
 
-import psycopg2
-
-from app import database
-from app.database import get_session
-from configuration import configuration, AppConfig
-from utils.suid import get_suid
-from models.database.conversations import UserConversation
+from .db_benchmarks import (
+    benchmark_store_new_user_conversations,
+    benchmark_update_user_conversation,
+    benchmark_list_conversations_for_all_users,
+    benchmark_list_conversations_for_one_user,
+    benchmark_retrieve_conversation,
+    benchmark_retrieve_conversation_for_one_user,
+)
 
 # number of records to be stored in database before benchmarks
 SMALL_DB_RECORDS_COUNT = 100
@@ -22,449 +17,6 @@
 LARGE_DB_RECORDS_COUNT = 10000
 
 
-@pytest.fixture(name="configuration_filename_sqlite")
-def configuration_filename_sqlite_fixture() -> str:
-    """Retrieve configuration file name to be used by benchmarks.
-
-    Parameters:
-        None
-
-    Returns:
-        str: Path to the benchmark configuration file to load.
-    """
-    return "tests/configuration/benchmarks-sqlite.yaml"
-
-
-@pytest.fixture(name="configuration_filename_postgres")
-def configuration_filename_postgres_fixture() -> str:
-    """Retrieve configuration file name to be used by benchmarks.
-
-    Parameters:
-        None
-
-    Returns:
-        str: Path to the benchmark configuration file to load.
-    """
-    return "tests/configuration/benchmarks-postgres.yaml"
-
-
-@pytest.fixture(name="sqlite_database")
-def sqlite_database_fixture(configuration_filename_sqlite: str, tmp_path: Path) -> None:
-    """Initialize a temporary SQLite database for benchmarking.
-
-    This fixture:
-    - Loads the provided configuration file.
-    - Ensures an SQLite configuration is present.
-    - Uses a temp path for the SQLite DB file to guarantee a fresh DB for each run.
-    - Initializes the DB engine and creates required tables.
-
-    Parameters:
-        configuration_filename_sqlite (str): Path to the YAML configuration file to load.
-        tmp_path (Path): pytest-provided temporary directory for creating the DB file.
-
-    Raises:
-        AssertionError: If the configuration does not include an sqlite configuration.
-    """
-    # try to load the configuration containing SQLite database setup
-    configuration.load_configuration(configuration_filename_sqlite)
-    assert configuration.database_configuration.sqlite is not None
-
-    # we need to start each benchmark with empty database
-    configuration.database_configuration.sqlite.db_path = str(tmp_path / "database.db")
-
-    # initialize database session and create tables
-    database.initialize_database()
-    database.create_tables()
-
-
-def drop_postgres_tables(configuration: AppConfig) -> None:
-    """Drop postgres tables used by benchmarks.
-
-    The tables will be re-created so every benchmark start with fresh DB.
-    """
-
-    pgconfig = configuration.database_configuration.postgres
-    assert pgconfig is not None
-
-    # try to connect to Postgres
-    conn = psycopg2.connect(
-        database=pgconfig.db,
-        user=pgconfig.user,
-        password=pgconfig.password.get_secret_value(),
-        host=pgconfig.host,
-        port=pgconfig.port,
-    )
-
-    # try to drop tables used by benchmarks
-    try:
-        with conn.cursor() as cursor:
-            cursor.execute("DROP TABLE IF EXISTS user_turn;")
-            cursor.execute("DROP TABLE IF EXISTS user_conversation;")
-        conn.commit()
-    finally:
-        # closing the connection
-        conn.close()
-
-
-@pytest.fixture(name="postgres_database")
-def postgres_database_fixture(configuration_filename_postgres: str) -> None:
-    """Initialize a temporary postgres database for benchmarking.
-
-    This fixture:
-    - Loads the provided configuration file.
-    - Ensures an Postgres configuration is present.
-    - Initializes the DB engine and creates required tables.
-
-    Parameters:
-        configuration_filename_postgres (str): Path to the YAML configuration file to load.
-
-    Raises:
-        AssertionError: If the configuration does not include an postgres configuration.
-    """
-    # try to load the configuration containing postgres database setup
-    configuration.load_configuration(configuration_filename_postgres)
-    assert configuration.database_configuration.postgres is not None
-
-    # make sure all tables will be re-initialized
-    drop_postgres_tables(configuration)
-
-    # initialize database session and create tables
-    database.initialize_database()
-    database.create_tables()
-
-
-def generate_provider() -> str:
-    """Return a randomly chosen provider name.
-
-    The provider is selected from a predefined list of possible providers to
-    simulate different user conversation during benchmarks.
-
-    Returns:
-        str: Selected provider name.
-    """
-    providers = [
-        "openai",
-        "azure",
-        "vertexAI",
-        "watsonx",
-        "RHOAI (vLLM)",
-        "RHAIIS (vLLM)",
-        "RHEL AI (vLLM)",
-    ]
-    return random.choice(providers)
-
-
-def generate_model_for_provider(provider: str) -> str:
-    """Return a randomly chosen model ID for a given provider.
-
-    Parameters:
-        provider (str): Name of the provider for which to pick a model.
-
-    Returns:
-        str: A model identifier associated with the given provider. If the
-            provider is unknown, a fallback value of "foo" is returned.
-    """
-    models: dict[str, list[str]] = {
-        "openai": [
-            "gpt-5",
-            "gpt-5.2",
-            "gpt-5.2 pro",
-            "gpt-5 mini",
-            "gpt-4.1",
-            "gpt-4o",
-            "gpt-4-turbo",
-            "gpt-4.1 mini",
-            "gpt-4.1 nano",
-            "o4-mini",
-            "o1",
-            "o3",
-            "o4",
-        ],
-        "azure": [
-            "gpt-5",
-            "gpt-5-mini",
-            "gpt-5-nano",
-            "gpt-4.1",
-            "gpt-4.1 mini",
-            "gpt-5-chat",
-            "gpt-5.1",
-            "gpt-5.1-codex",
-            "gpt-5.2",
-            "gpt-5.2-chat",
-            "gpt-5.2-codex",
-            "claude-opus-4-5",
-            "claude-haiku-4-5",
-            "claude-sonnet-4-5",
-            "DeepSeek-v3.1",
-        ],
-        "vertexAI": [
-            "google/gemini-2.0-flash",
-            "google/gemini-2.5-flash",
-            "google/gemini-2.5-pro",
-        ],
-        "watsonx": [
-            "all-mini-l6-v2",
-            "multilingual-e5-large",
-            "granite-embedding-107m-multilingual",
-            "ibm-granite/granite-4.0-micro",
-            "ibm-granite/granite-4.0-micro-base",
-            "ibm-granite/granite-4.0-h-micro",
-            "ibm-granite/granite-4.0-h-micro-base",
-            "ibm-granite/granite-4.0-h-tiny",
-            "ibm-granite/granite-4.0-h-tiny-base",
-            "ibm-granite/granite-4.0-h-small",
-            "ibm-granite/granite-4.0-h-small-base",
-            "ibm-granite/granite-4.0-tiny-preview",
-            "ibm-granite/granite-4.0-tiny-base-preview",
-        ],
-        "RHOAI (vLLM)": ["meta-llama/Llama-3.2-1B-Instruct"],
-        "RHAIIS (vLLM)": ["meta-llama/Llama-3.1-8B-Instruct"],
-        "RHEL AI (vLLM)": ["meta-llama/Llama-3.1-8B-Instruct"],
-    }
-    return random.choice(models.get(provider, ["foo"]))
-
-
-def generate_topic_summary() -> str:
-    """Return a randomized topic summary string.
-
-    The summary is constructed by selecting one phrase from each of several
-    phrase groups to create varied but deterministic-looking summaries for the
-    test data.
-
-    Returns:
-        str: Generated summary sentence ending with a period.
-    """
-    yaps = [
-        [
-            "Soudruzi,",
-            "Na druhe strane",
-            "Stejne tak",
-            "Nesmime vsak zapominat, ze",
-            "Timto zpusobem",
-            "Zavaznost techto problemu je natolik zrejma, ze",
-            "Kazdodenni praxe nam potvrzuje, ze",
-            "Pestre a bohate zkusenosti",
-            "Poslani organizace, zejmena pak",
-            "Ideove uvahy nejvyssiho radu a rovnez",
-        ],
-        [
-            "realizace planovanych vytycenych ukolu",
-            "ramec a mista vychovy kadru",
-            "stabilni a kvantitativni vzrust a sfera nasi aktivity",
-            "vytvorena struktura organizace",
-            "novy model organizacni cinnosti",
-            "stale, informacne-propagandisticke zabezpeceni nasi prace",
-            "dalsi rozvoj ruznych forem cinnosti",
-            "upresneni a rozvoj struktur",
-            "konzultace se sirokym aktivem",
-            "pocatek kazdodenni prace na poli formovani pozice",
-        ],
-        [
-            "hraje zavaznou roli pri utvareni",
-            "vyzaduji od nas analyzy",
-            "vyzaduji nalezeni a jednoznacne upresneni",
-            "napomaha priprave a realizaci",
-            "zabezpecuje sirokemu okruhu specialistu ucast pri tvorbe",
-            "ve znacne mire podminuje vytvoreni",
-            "umoznuje splnit vyznamne ukoly na rozpracovani",
-            "umoznuje zhodnotit vyznam",
-            "predstavuje pozoruhodny experiment proverky",
-            "vyvolava proces zavadeni a modernizace",
-        ],
-        [
-            "existujicich financnich a administrativnich podminek",
-            "dalsich smeru rozvoje",
-            "systemu masove ucasti",
-            "pozic jednotlivych ucastniku k zadanym ukolum",
-            "novych navrhu",
-            "systemu vychovy kadru odpovidajicich aktualnim potrebam",
-            "smeru progresivniho rozvoje",
-            "odpovidajicich podminek aktivizace",
-            "modelu rozvoje",
-            "forem pusobeni",
-        ],
-    ]
-
-    summary = " ".join([random.choice(yap) for yap in yaps]) + "."
-    return summary
-
-
-def store_new_user_conversation(
-    session: Session, id: Optional[str] = None, user_id: Optional[str] = None
-) -> None:
-    """Store the new user conversation into database.
-
-    This helper constructs a UserConversation structure with randomized
-    provider/model and topic summary values and commits it into the provided
-    session.
-
-    Parameters:
-        session (Session): SQLAlchemy session used to persist the record.
-        id (Optional[str]): Optional explicit ID to assign to the new conversation.
-            If not provided, a generated suid will be used.
-        user_id (Optional[str]): Optional explicit user ID to assign to the new
-            conversation. If not provided, a generated suid will be used.
-
-    Returns:
-        None
-    """
-    provider = generate_provider()
-    model = generate_model_for_provider(provider)
-    topic_summary = generate_topic_summary()
-    conversation = UserConversation(
-        id=id or get_suid(),
-        user_id=user_id or get_suid(),
-        last_used_model=model,
-        last_used_provider=provider,
-        topic_summary=topic_summary,
-        last_message_at=datetime.now(UTC),
-        message_count=1,
-    )
-    session.add(conversation)
-    session.commit()
-
-
-def update_user_conversation(session: Session, id: str) -> None:
-    """Update existing conversation in the database.
-
-    This helper constructs a UserConversation structure with randomized
-    provider/model and topic summary values and commits it into the provided
-    session.
-
-    Parameters:
-        session (Session): SQLAlchemy session used to persist the record.
-        id (Optional[str]): Optional explicit ID to assign to the new conversation.
-            If not provided, a generated suid will be used.
-
-    Returns:
-        None
-    """
-    provider = generate_provider()
-    model = generate_model_for_provider(provider)
-    topic_summary = generate_topic_summary()
-
-    existing_conversation = session.query(UserConversation).filter_by(id=id).first()
-    assert existing_conversation is not None
-
-    existing_conversation.last_used_model = model
-    existing_conversation.last_used_provider = provider
-    existing_conversation.last_message_at = datetime.now(UTC)
-    existing_conversation.message_count += 1
-    existing_conversation.topic_summary = topic_summary
-    session.commit()
-
-
-def list_conversation_for_all_users(session: Session) -> None:
-    """Query and assert retrieval of all user conversations.
-
-    This helper queries all UserConversation records and asserts that the
-    result is a list (possibly empty). It is intended for use in a benchmark
-    that measures the listing performance.
-
-    Parameters:
-        session (Session): SQLAlchemy session used to query conversations.
-
-    Returns:
-        None
-    """
-    query = session.query(UserConversation)
-
-    user_conversations = query.all()
-    assert user_conversations is not None
-    assert len(user_conversations) >= 0
-
-
-def retrieve_conversation(
-    session: Session, conversation_id: str, should_be_none: bool
-) -> None:
-    """Query and assert retrieval of one conversation.
-
-    This helper function retrieves one given conversation from a database. It
-    is intended for use in a benchmark that measures the listing performance.
-
-    Parameters:
-        session (Session): SQLAlchemy session used to query conversations.
-
-    Returns:
-        None
-    """
-    query = session.query(UserConversation).filter_by(id=conversation_id)
-
-    conversation = query.first()
-    if should_be_none:
-        assert conversation is None
-    else:
-        assert conversation is not None
-
-
-def retrieve_conversation_for_one_user(
-    session: Session, user_id: str, conversation_id: str, should_be_none: bool
-) -> None:
-    """Query and assert retrieval of one conversation.
-
-    This helper function retrieves one given conversation from a database. It
-    is intended for use in a benchmark that measures the listing performance.
-
-    Parameters:
-        session (Session): SQLAlchemy session used to query conversations.
-
-    Returns:
-        None
-    """
-    query = session.query(UserConversation).filter_by(
-        id=conversation_id, user_id=user_id
-    )
-
-    conversation = query.first()
-    if should_be_none:
-        assert conversation is None
-    else:
-        assert conversation is not None
-
-
-def list_conversation_for_one_user(session: Session, user_id: str) -> None:
-    """Query and assert retrieval of one user conversation.
-
-    This helper queries all UserConversation records and asserts that the
-    result is a list (possibly empty). It is intended for use in a benchmark
-    that measures the listing performance.
-
-    Parameters:
-        session (Session): SQLAlchemy session used to query conversations.
-
-    Returns:
-        None
-    """
-    query = session.query(UserConversation).filter_by(user_id=user_id)
-
-    user_conversations = query.all()
-    assert user_conversations is not None
-    assert len(user_conversations) >= 0
-
-
-def benchmark_store_new_user_conversations(
-    benchmark: BenchmarkFixture, records_to_insert: int
-) -> None:
-    """Prepare DB and benchmark storing a single new conversation.
-
-    The database is pre-populated with ``records_to_insert`` records, then the
-    benchmark task stores one more conversation (using the helper above).
-
-    Parameters:
-        benchmark (BenchmarkFixture): pytest-benchmark fixture to run the measurement.
-        records_to_insert (int): Number of records to pre-populate before benchmarking.
-
-    Returns:
-        None
-    """
-    with get_session() as session:
-        # store bunch of conversations first
-        for id in range(records_to_insert):
-            store_new_user_conversation(session, str(id))
-        # then perform the benchmark
-        benchmark(store_new_user_conversation, session)
-
-
 def test_sqlite_store_new_user_conversations_empty_db(
     sqlite_database: None, benchmark: BenchmarkFixture
 ) -> None:
@@ -533,37 +85,6 @@ def test_sqlite_store_new_user_conversations_large_db(
     benchmark_store_new_user_conversations(benchmark, LARGE_DB_RECORDS_COUNT)
 
 
-def benchmark_update_user_conversation(
-    benchmark: BenchmarkFixture, records_to_insert: int
-) -> None:
-    """Prepare DB and benchmark updating a single existing conversation.
-
-    The database is pre-populated with ``records_to_insert`` records. Ensures
-    that a record with id "1234" exists (inserting it explicitly when needed)
-    and then benchmarks updating that conversation.
-
-    Parameters:
-        benchmark (BenchmarkFixture): pytest-benchmark fixture to run the measurement.
-        records_to_insert (int): Number of records to pre-populate before benchmarking.
-
-    Returns:
-        None
-    """
-    with get_session() as session:
-        # store bunch of conversations first
-        # Ensure record "1234" exists for the update benchmark.
-        # if records_to_insert <= 1234, range() won't include 1234, so insert it explicitly.
-        if records_to_insert <= 1234:
-            store_new_user_conversation(session, "1234")
-
-        # pre-populate database with records
-        for id in range(records_to_insert):
-            store_new_user_conversation(session, str(id))
-
-        # then perform the benchmark
-        benchmark(update_user_conversation, session, "1234")
-
-
 def test_sqlite_update_user_conversation_empty_db(
     sqlite_database: None,
     benchmark: BenchmarkFixture,
@@ -628,29 +149,6 @@ def test_sqlite_update_user_conversation_large_db(
     benchmark_update_user_conversation(benchmark, LARGE_DB_RECORDS_COUNT)
 
 
-def benchmark_list_conversations_for_all_users(
-    benchmark: BenchmarkFixture, records_to_insert: int
-) -> None:
-    """Prepare DB and benchmark listing all conversations.
-
-    Pre-populates the DB with ``records_to_insert`` entries and benchmarks
-    the performance of querying and retrieving all UserConversation rows.
-
-    Parameters:
-        benchmark (BenchmarkFixture): pytest-benchmark fixture to run the measurement.
-        records_to_insert (int): Number of records to pre-populate before benchmarking.
-
-    Returns:
-        None
-    """
-    with get_session() as session:
-        # store bunch of conversations first
-        for id in range(records_to_insert):
-            store_new_user_conversation(session, str(id))
-        # then perform the benchmark
-        benchmark(list_conversation_for_all_users, session)
-
-
 def test_sqlite_list_conversations_for_all_users_empty_db(
     sqlite_database: None, benchmark: BenchmarkFixture
 ) -> None:
@@ -711,32 +209,6 @@ def test_sqlite_list_conversations_for_all_users_large_db(
     benchmark_list_conversations_for_all_users(benchmark, LARGE_DB_RECORDS_COUNT)
 
 
-def benchmark_list_conversations_for_one_user(
-    benchmark: BenchmarkFixture, records_to_insert: int
-) -> None:
-    """Prepare DB and benchmark listing all conversations.
-
-    Pre-populates the DB with ``records_to_insert`` entries and benchmarks
-    the performance of querying and retrieving all UserConversation rows.
-
-    Parameters:
-        benchmark (BenchmarkFixture): pytest-benchmark fixture to run the measurement.
-        records_to_insert (int): Number of records to pre-populate before benchmarking.
-
-    Returns:
-        None
-    """
-    with get_session() as session:
-        # store bunch of conversations first
-        for id in range(records_to_insert):
-            # use explicit conversation ID and also user ID
-            store_new_user_conversation(session, str(id), str(id))
-        # user ID somewhere in the middle of database
-        user_id = str(records_to_insert / 2)
-        # then perform the benchmark
-        benchmark(list_conversation_for_one_user, session, user_id)
-
-
 def test_sqlite_list_conversations_for_one_user_empty_db(
     sqlite_database: None, benchmark: BenchmarkFixture
 ) -> None:
@@ -797,34 +269,6 @@ def test_sqlite_list_conversations_for_one_user_large_db(
     benchmark_list_conversations_for_one_user(benchmark, LARGE_DB_RECORDS_COUNT)
 
 
-def benchmark_retrieve_conversation(
-    benchmark: BenchmarkFixture, records_to_insert: int
-) -> None:
-    """Prepare DB and benchmark retrieving one conversation.
-
-    Pre-populates the DB with ``records_to_insert`` entries and benchmarks
-    the performance of querying and retrieving one UserConversation record.
-
-    Parameters:
-        benchmark (BenchmarkFixture): pytest-benchmark fixture to run the measurement.
-        records_to_insert (int): Number of records to pre-populate before benchmarking.
-
-    Returns:
-        None
-    """
-    with get_session() as session:
-        # store bunch of conversations first
-        for id in range(records_to_insert):
-            # use explicit conversation ID and also user ID
-            store_new_user_conversation(session, str(id), str(id))
-        # user ID somewhere in the middle of database
-        conversation_id = str(records_to_insert // 2)
-        # then perform the benchmark
-        benchmark(
-            retrieve_conversation, session, conversation_id, records_to_insert == 0
-        )
-
-
 def test_sqlite_retrieve_conversation_empty_db(
     sqlite_database: None, benchmark: BenchmarkFixture
 ) -> None:
@@ -885,39 +329,6 @@ def test_sqlite_retrieve_conversation_large_db(
     benchmark_retrieve_conversation(benchmark, LARGE_DB_RECORDS_COUNT)
 
 
-def benchmark_retrieve_conversation_for_one_user(
-    benchmark: BenchmarkFixture, records_to_insert: int
-) -> None:
-    """Prepare DB and benchmark retrieving one conversation.
-
-    Pre-populates the DB with ``records_to_insert`` entries and benchmarks
-    the performance of querying and retrieving one UserConversation record.
-
-    Parameters:
-        benchmark (BenchmarkFixture): pytest-benchmark fixture to run the measurement.
-        records_to_insert (int): Number of records to pre-populate before benchmarking.
-
-    Returns:
-        None
-    """
-    with get_session() as session:
-        # store bunch of conversations first
-        for id in range(records_to_insert):
-            # use explicit conversation ID and also user ID
-            store_new_user_conversation(session, str(id), str(id))
-        # user ID somewhere in the middle of database
-        user_id = str(records_to_insert // 2)
-        conversation_id = str(records_to_insert // 2)
-        # then perform the benchmark
-        benchmark(
-            retrieve_conversation_for_one_user,
-            session,
-            user_id,
-            conversation_id,
-            records_to_insert == 0,  # a flag whether records should be read
-        )
-
-
 def test_sqlite_retrieve_conversation_for_one_user_empty_db(
     sqlite_database: None, benchmark: BenchmarkFixture
 ) -> None:

From 88d0c924e864a7dff0c333ab94ba9eefa1eb42ed Mon Sep 17 00:00:00 2001
From: Pavel Tisnovsky <ptisnovs@redhat.com>
Date: Mon, 16 Feb 2026 11:11:15 +0100
Subject: [PATCH 2/2] Comparison benchmarks

---
 tests/benchmarks/conftest.py                  |   1 -
 .../test_app_database_comparison.py           | 132 ++++++++++++++++++
 2 files changed, 132 insertions(+), 1 deletion(-)
 create mode 100644 tests/benchmarks/test_app_database_comparison.py

diff --git a/tests/benchmarks/conftest.py b/tests/benchmarks/conftest.py
index 82a40b67d..267062c97 100644
--- a/tests/benchmarks/conftest.py
+++ b/tests/benchmarks/conftest.py
@@ -69,7 +69,6 @@ def drop_postgres_tables(configuration: AppConfig) -> None:
 
     The tables will be re-created so every benchmark start with fresh DB.
     """
-
     pgconfig = configuration.database_configuration.postgres
     assert pgconfig is not None
 
diff --git a/tests/benchmarks/test_app_database_comparison.py b/tests/benchmarks/test_app_database_comparison.py
new file mode 100644
index 000000000..4043e4a52
--- /dev/null
+++ b/tests/benchmarks/test_app_database_comparison.py
@@ -0,0 +1,132 @@
+"""Benchmarks to compare performances of SQLite and PostgreSQL databases."""
+
+import pytest
+from pytest_benchmark.fixture import BenchmarkFixture
+
+from .db_benchmarks import (
+    benchmark_store_new_user_conversations,
+    benchmark_update_user_conversation,
+    benchmark_list_conversations_for_all_users,
+    benchmark_list_conversations_for_one_user,
+    benchmark_retrieve_conversation,
+    benchmark_retrieve_conversation_for_one_user,
+)
+
+# number of records to be stored in database before benchmarks
+DB_RECORDS_COUNT = 100
+
+
+@pytest.mark.parametrize("db_fixture", ["sqlite_database", "postgres_database"])
+def test_store_new_user_conversations(
+    request: pytest.FixtureRequest,
+    db_fixture: str,
+    benchmark: BenchmarkFixture,
+) -> None:
+    """Benchmark for the DB operation to create and store new topic and conversation ID mapping.
+
+    Benchmark is performed against small DB.
+
+    Parameters:
+        sqlite_database: Fixture that prepares a temporary SQLite DB.
+        benchmark (BenchmarkFixture): pytest-benchmark fixture.
+
+    Returns:
+        None
+    """
+    request.getfixturevalue(db_fixture)
+    benchmark_store_new_user_conversations(benchmark, DB_RECORDS_COUNT)
+
+
+@pytest.mark.parametrize("db_fixture", ["sqlite_database", "postgres_database"])
+def test_update_user_conversation(
+    request: pytest.FixtureRequest,
+    db_fixture: str,
+    benchmark: BenchmarkFixture,
+) -> None:
+    """Benchmark updating conversation on small database.
+
+    Parameters:
+        sqlite_database: Fixture that prepares a temporary SQLite DB.
+        benchmark (BenchmarkFixture): pytest-benchmark fixture.
+
+    Returns:
+        None
+    """
+    request.getfixturevalue(db_fixture)
+    benchmark_update_user_conversation(benchmark, DB_RECORDS_COUNT)
+
+
+@pytest.mark.parametrize("db_fixture", ["sqlite_database", "postgres_database"])
+def test_list_conversations_for_all_users(
+    request: pytest.FixtureRequest,
+    db_fixture: str,
+    benchmark: BenchmarkFixture,
+) -> None:
+    """Benchmark listing conversations on small database.
+
+    Parameters:
+        sqlite_database: Fixture that prepares a temporary SQLite DB.
+        benchmark (BenchmarkFixture): pytest-benchmark fixture.
+
+    Returns:
+        None
+    """
+    request.getfixturevalue(db_fixture)
+    benchmark_list_conversations_for_all_users(benchmark, DB_RECORDS_COUNT)
+
+
+@pytest.mark.parametrize("db_fixture", ["sqlite_database", "postgres_database"])
+def test_list_conversations_for_one_user(
+    request: pytest.FixtureRequest,
+    db_fixture: str,
+    benchmark: BenchmarkFixture,
+) -> None:
+    """Benchmark listing conversations on an small database.
+
+    Parameters:
+        sqlite_database: Fixture that prepares a temporary SQLite DB.
+        benchmark (BenchmarkFixture): pytest-benchmark fixture.
+
+    Returns:
+        None
+    """
+    request.getfixturevalue(db_fixture)
+    benchmark_list_conversations_for_one_user(benchmark, DB_RECORDS_COUNT)
+
+
+@pytest.mark.parametrize("db_fixture", ["sqlite_database", "postgres_database"])
+def test_retrieve_conversation(
+    request: pytest.FixtureRequest,
+    db_fixture: str,
+    benchmark: BenchmarkFixture,
+) -> None:
+    """Benchmark retrieving conversations on a small database.
+
+    Parameters:
+        sqlite_database: Fixture that prepares a temporary SQLite DB.
+        benchmark (BenchmarkFixture): pytest-benchmark fixture.
+
+    Returns:
+        None
+    """
+    request.getfixturevalue(db_fixture)
+    benchmark_retrieve_conversation(benchmark, DB_RECORDS_COUNT)
+
+
+@pytest.mark.parametrize("db_fixture", ["sqlite_database", "postgres_database"])
+def test_retrieve_conversation_for_one_user(
+    request: pytest.FixtureRequest,
+    db_fixture: str,
+    benchmark: BenchmarkFixture,
+) -> None:
+    """Benchmark retrieving conversations on a small database.
+
+    Parameters:
+        sqlite_database: Fixture that prepares a temporary SQLite DB.
+        benchmark (BenchmarkFixture): pytest-benchmark fixture.
+
+    Returns:
+        None
+    """
+    request.getfixturevalue(db_fixture)
+    benchmark_retrieve_conversation_for_one_user(benchmark, DB_RECORDS_COUNT)