Skip to content
Snippets Groups Projects
Verified Commit 0796ac6c authored by Antoine R. Dumont's avatar Antoine R. Dumont
Browse files

Move SWHDatabaseJanitor to db.pytest_plugin module

parent a7d1aa7b
No related branches found
No related tags found
1 merge request!179Move SWHDatabaseJanitor to db.pytest_plugin module
......@@ -4,17 +4,12 @@
# See top-level LICENSE file for more information
import functools
import glob
import logging
import re
import subprocess
from typing import Optional, Set, Union
from typing import Optional, Union
import psycopg2
import psycopg2.extensions
from pytest_postgresql.janitor import DatabaseJanitor, Version
from swh.core.utils import numfile_sortkey as sortkey
logger = logging.getLogger(__name__)
......@@ -255,112 +250,3 @@ def execute_values_generator(cur, sql, argslist, template=None, page_size=100):
parts[-1:] = post
cur.execute(b"".join(parts))
yield from cur
class SWHDatabaseJanitor(DatabaseJanitor):
"""SWH database janitor implementation with a a different setup/teardown policy than
than the stock one. Instead of dropping, creating and initializing the database for
each test, it creates and initializes the db once, then truncates the tables (and
sequences) in between tests.
This is needed to have acceptable test performances.
"""
def __init__(
self,
user: str,
host: str,
port: str,
db_name: str,
version: Union[str, float, Version],
dump_files: Optional[str] = None,
no_truncate_tables: Set[str] = set(),
) -> None:
super().__init__(user, host, port, db_name, version)
if dump_files:
self.dump_files = sorted(glob.glob(dump_files), key=sortkey)
else:
self.dump_files = []
# do no truncate the following tables
self.no_truncate_tables = set(no_truncate_tables)
def db_setup(self):
conninfo = (
f"host={self.host} user={self.user} port={self.port} dbname={self.db_name}"
)
for fname in self.dump_files:
subprocess.check_call(
[
"psql",
"--quiet",
"--no-psqlrc",
"-v",
"ON_ERROR_STOP=1",
"-d",
conninfo,
"-f",
fname,
]
)
def db_reset(self):
"""Truncate tables (all but self.no_truncate_tables set) and sequences
"""
with psycopg2.connect(
dbname=self.db_name, user=self.user, host=self.host, port=self.port,
) as cnx:
with cnx.cursor() as cur:
cur.execute(
"SELECT table_name FROM information_schema.tables "
"WHERE table_schema = %s",
("public",),
)
all_tables = set(table for (table,) in cur.fetchall())
tables_to_truncate = all_tables - self.no_truncate_tables
for table in tables_to_truncate:
cur.execute("TRUNCATE TABLE %s CASCADE" % table)
cur.execute(
"SELECT sequence_name FROM information_schema.sequences "
"WHERE sequence_schema = %s",
("public",),
)
seqs = set(seq for (seq,) in cur.fetchall())
for seq in seqs:
cur.execute("ALTER SEQUENCE %s RESTART;" % seq)
cnx.commit()
def init(self):
"""Initialize db. Create the db if it does not exist. Reset it if it exists."""
with self.cursor() as cur:
cur.execute(
"SELECT COUNT(1) FROM pg_database WHERE datname=%s;", (self.db_name,)
)
db_exists = cur.fetchone()[0] == 1
if db_exists:
cur.execute(
"UPDATE pg_database SET datallowconn=true WHERE datname = %s;",
(self.db_name,),
)
self.db_reset()
return
# initialize the inexistent db
with self.cursor() as cur:
cur.execute('CREATE DATABASE "{}";'.format(self.db_name))
self.db_setup()
def drop(self):
"""The original DatabaseJanitor implementation prevents new connections from happening,
destroys current opened connections and finally drops the database.
We actually do not want to drop the db so we instead do nothing and resets
(truncate most tables and sequences) the db instead, in order to have some
acceptable performance.
"""
pass
......@@ -3,18 +3,130 @@
# License: GNU General Public License version 3, or any later version
# See top-level LICENSE file for more information
import glob
import logging
from typing import Optional, Set
import subprocess
from typing import Optional, Set, Union
import psycopg2
import pytest
from pytest_postgresql import factories
from pytest_postgresql.janitor import DatabaseJanitor, Version
from swh.core.db.db_utils import SWHDatabaseJanitor
from swh.core.utils import numfile_sortkey as sortkey
logger = logging.getLogger(__name__)
class SWHDatabaseJanitor(DatabaseJanitor):
"""SWH database janitor implementation with a a different setup/teardown policy than
than the stock one. Instead of dropping, creating and initializing the database for
each test, it creates and initializes the db once, then truncates the tables (and
sequences) in between tests.
This is needed to have acceptable test performances.
"""
def __init__(
self,
user: str,
host: str,
port: str,
db_name: str,
version: Union[str, float, Version],
dump_files: Optional[str] = None,
no_truncate_tables: Set[str] = set(),
) -> None:
super().__init__(user, host, port, db_name, version)
if dump_files:
self.dump_files = sorted(glob.glob(dump_files), key=sortkey)
else:
self.dump_files = []
# do no truncate the following tables
self.no_truncate_tables = set(no_truncate_tables)
def db_setup(self):
conninfo = (
f"host={self.host} user={self.user} port={self.port} dbname={self.db_name}"
)
for fname in self.dump_files:
subprocess.check_call(
[
"psql",
"--quiet",
"--no-psqlrc",
"-v",
"ON_ERROR_STOP=1",
"-d",
conninfo,
"-f",
fname,
]
)
def db_reset(self):
"""Truncate tables (all but self.no_truncate_tables set) and sequences
"""
with psycopg2.connect(
dbname=self.db_name, user=self.user, host=self.host, port=self.port,
) as cnx:
with cnx.cursor() as cur:
cur.execute(
"SELECT table_name FROM information_schema.tables "
"WHERE table_schema = %s",
("public",),
)
all_tables = set(table for (table,) in cur.fetchall())
tables_to_truncate = all_tables - self.no_truncate_tables
for table in tables_to_truncate:
cur.execute("TRUNCATE TABLE %s CASCADE" % table)
cur.execute(
"SELECT sequence_name FROM information_schema.sequences "
"WHERE sequence_schema = %s",
("public",),
)
seqs = set(seq for (seq,) in cur.fetchall())
for seq in seqs:
cur.execute("ALTER SEQUENCE %s RESTART;" % seq)
cnx.commit()
def init(self):
"""Initialize db. Create the db if it does not exist. Reset it if it exists."""
with self.cursor() as cur:
cur.execute(
"SELECT COUNT(1) FROM pg_database WHERE datname=%s;", (self.db_name,)
)
db_exists = cur.fetchone()[0] == 1
if db_exists:
cur.execute(
"UPDATE pg_database SET datallowconn=true WHERE datname = %s;",
(self.db_name,),
)
self.db_reset()
return
# initialize the inexistent db
with self.cursor() as cur:
cur.execute('CREATE DATABASE "{}";'.format(self.db_name))
self.db_setup()
def drop(self):
"""The original DatabaseJanitor implementation prevents new connections from happening,
destroys current opened connections and finally drops the database.
We actually do not want to drop the db so we instead do nothing and resets
(truncate most tables and sequences) the db instead, in order to have some
acceptable performance.
"""
pass
# the postgres_fact factory fixture below is mostly a copy of the code
# from pytest-postgresql. We need a custom version here to be able to
# specify our version of the DBJanitor we use.
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment