-
Notifications
You must be signed in to change notification settings - Fork 42
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Merge pull request #1162 from freedomofpress/1149_data_migration
add data migration testing and fix journalist association in replies table
- Loading branch information
Showing
5 changed files
with
334 additions
and
0 deletions.
There are no files selected for viewing
56 changes: 56 additions & 0 deletions
56
alembic/versions/a4bf1f58ce69_fix_journalist_association_in_replies.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,56 @@ | ||
"""fix journalist association in replies table | ||
Revision ID: a4bf1f58ce69 | ||
Revises: 7f682532afa2 | ||
Create Date: 2020-10-20 13:49:53.035383 | ||
""" | ||
from alembic import op | ||
|
||
|
||
# revision identifiers, used by Alembic. | ||
revision = 'a4bf1f58ce69' | ||
down_revision = '7f682532afa2' | ||
branch_labels = None | ||
depends_on = None | ||
|
||
|
||
def upgrade(): | ||
""" | ||
Fix reply association with journalist by updating journalist uuid to journalist id in the | ||
journalist_id column. | ||
""" | ||
conn = op.get_bind() | ||
cursor = conn.execute(""" | ||
SELECT journalist_id | ||
FROM replies, users | ||
WHERE journalist_id=users.uuid; | ||
""") | ||
|
||
replies_with_incorrect_associations = cursor.fetchall() | ||
if not replies_with_incorrect_associations: | ||
return | ||
|
||
conn.execute(""" | ||
UPDATE replies | ||
SET journalist_id= | ||
( | ||
SELECT users.id | ||
FROM users | ||
WHERE journalist_id=users.uuid | ||
) | ||
WHERE exists | ||
( | ||
SELECT users.id | ||
FROM users | ||
WHERE journalist_id=users.uuid | ||
); | ||
""") | ||
|
||
|
||
def downgrade(): | ||
""" | ||
We do not want to undo this bug fix, because nothing will break if we downgrade to an earlier | ||
version of the client. | ||
""" | ||
pass |
Empty file.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,89 @@ | ||
# -*- coding: utf-8 -*- | ||
|
||
import os | ||
import random | ||
import subprocess | ||
|
||
from securedrop_client import db | ||
from securedrop_client.db import Reply, User | ||
|
||
from .utils import add_reply, add_source, add_user | ||
|
||
random.seed("=^..^=..^=..^=") | ||
|
||
|
||
class UpgradeTester: | ||
""" | ||
Verify that upgrading to the target migration results in the replacement of uuid with id of the | ||
user in the replies table's journalist_id column. | ||
""" | ||
|
||
NUM_USERS = 20 | ||
NUM_SOURCES = 20 | ||
NUM_REPLIES = 40 | ||
|
||
def __init__(self, homedir): | ||
subprocess.check_call(["sqlite3", os.path.join(homedir, "svs.sqlite"), ".databases"]) | ||
self.session = db.make_session_maker(homedir)() | ||
|
||
def load_data(self): | ||
""" | ||
Load data that has the bug where user.uuid is stored in replies.journalist_id. | ||
""" | ||
for _ in range(self.NUM_SOURCES): | ||
add_source(self.session) | ||
|
||
self.session.commit() | ||
|
||
for i in range(self.NUM_USERS): | ||
if i == 0: | ||
# As of this migration, the server tells the client that the associated journalist | ||
# of a reply has been deleted by returning "deleted" as the uuid of the associated | ||
# journalist. This gets stored as the jouranlist_id in the replies table. | ||
# | ||
# Make sure to test this case as well. | ||
add_user(self.session, "deleted") | ||
source_id = random.randint(1, self.NUM_SOURCES) | ||
add_reply(self.session, "deleted", source_id) | ||
else: | ||
add_user(self.session) | ||
|
||
self.session.commit() | ||
|
||
# Add replies from randomly-selected journalists to a randomly-selected sources | ||
for _ in range(1, self.NUM_REPLIES): | ||
journalist_id = random.randint(1, self.NUM_USERS) | ||
journalist = self.session.query(User).filter_by(id=journalist_id).one() | ||
source_id = random.randint(1, self.NUM_SOURCES) | ||
add_reply(self.session, journalist.uuid, source_id) | ||
|
||
self.session.commit() | ||
|
||
def check_upgrade(self): | ||
""" | ||
Make sure each reply in the replies table has the correct journalist_id stored for the | ||
associated journalist by making sure a User account exists with that journalist id. | ||
""" | ||
replies = self.session.query(Reply).all() | ||
assert len(replies) | ||
|
||
for reply in replies: | ||
# Will fail if User does not exist | ||
self.session.query(User).filter_by(id=reply.journalist_id).one() | ||
|
||
self.session.close() | ||
|
||
|
||
class DowngradeTester: | ||
""" | ||
Nothing to test since the downgrade path doesn't do anything. | ||
""" | ||
|
||
def __init__(self, homedir): | ||
pass | ||
|
||
def load_data(self): | ||
pass | ||
|
||
def check_downgrade(self): | ||
pass |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,154 @@ | ||
# -*- coding: utf-8 -*- | ||
import random | ||
import string | ||
from datetime import datetime | ||
from typing import Optional | ||
from uuid import uuid4 | ||
|
||
from sqlalchemy import text | ||
from sqlalchemy.orm.session import Session | ||
|
||
from securedrop_client.db import DownloadError, Source | ||
|
||
random.seed("ᕕ( ᐛ )ᕗ") | ||
|
||
|
||
def random_bool() -> bool: | ||
return bool(random.getrandbits(1)) | ||
|
||
|
||
def bool_or_none() -> Optional[bool]: | ||
return random.choice([None, True, False]) | ||
|
||
|
||
def random_name() -> str: | ||
len = random.randint(1, 100) | ||
return random_chars(len) | ||
|
||
|
||
def random_username() -> str: | ||
len = random.randint(3, 64) | ||
return random_chars(len) | ||
|
||
|
||
def random_chars(len: int, chars: str = string.printable) -> str: | ||
return "".join([random.choice(chars) for _ in range(len)]) | ||
|
||
|
||
def random_ascii_chars(len: int, chars: str = string.ascii_lowercase): | ||
return "".join([random.choice(chars) for _ in range(len)]) | ||
|
||
|
||
def random_datetime(nullable: bool = False): | ||
if nullable and random_bool(): | ||
return None | ||
else: | ||
return datetime( | ||
year=random.randint(1, 9999), | ||
month=random.randint(1, 12), | ||
day=random.randint(1, 28), | ||
hour=random.randint(0, 23), | ||
minute=random.randint(0, 59), | ||
second=random.randint(0, 59), | ||
microsecond=random.randint(0, 1000), | ||
) | ||
|
||
|
||
def add_source(session: Session) -> None: | ||
params = { | ||
"uuid": str(uuid4()), | ||
"journalist_designation": random_chars(50), | ||
"last_updated": random_datetime(nullable=True), | ||
"interaction_count": random.randint(0, 1000), | ||
} | ||
sql = """ | ||
INSERT INTO sources ( | ||
uuid, | ||
journalist_designation, | ||
last_updated, | ||
interaction_count | ||
) | ||
VALUES ( | ||
:uuid, | ||
:journalist_designation, | ||
:last_updated, | ||
:interaction_count | ||
) | ||
""" | ||
session.execute(text(sql), params) | ||
|
||
|
||
def add_user(session: Session, uuid: Optional[str] = None) -> None: | ||
if not uuid: | ||
journalist_uuid = str(uuid4()) | ||
else: | ||
journalist_uuid = uuid | ||
|
||
params = { | ||
"uuid": journalist_uuid, | ||
"username": random_username(), | ||
} | ||
sql = """ | ||
INSERT INTO users (uuid, username) | ||
VALUES (:uuid, :username) | ||
""" | ||
session.execute(text(sql), params) | ||
|
||
|
||
def add_reply(session: Session, journalist_id: int, source_id: int) -> None: | ||
is_downloaded = random_bool() if random_bool() else None | ||
is_decrypted = random_bool() if is_downloaded else None | ||
|
||
download_errors = session.query(DownloadError).all() | ||
download_error_ids = [error.id for error in download_errors] | ||
|
||
content = random_chars(1000) if is_downloaded else None | ||
|
||
source = session.query(Source).filter_by(id=source_id).one() | ||
|
||
file_counter = len(source.collection) + 1 | ||
|
||
params = { | ||
"uuid": str(uuid4()), | ||
"journalist_id": journalist_id, | ||
"source_id": source_id, | ||
"filename": random_chars(50) + "-reply.gpg", | ||
"file_counter": file_counter, | ||
"size": random.randint(0, 1024 * 1024 * 500), | ||
"content": content, | ||
"is_downloaded": is_downloaded, | ||
"is_decrypted": is_decrypted, | ||
"download_error_id": random.choice(download_error_ids), | ||
"last_updated": random_datetime(), | ||
} | ||
sql = """ | ||
INSERT INTO replies | ||
( | ||
uuid, | ||
journalist_id, | ||
source_id, | ||
filename, | ||
file_counter, | ||
size, | ||
content, | ||
is_downloaded, | ||
is_decrypted, | ||
download_error_id, | ||
last_updated | ||
) | ||
VALUES | ||
( | ||
:uuid, | ||
:journalist_id, | ||
:source_id, | ||
:filename, | ||
:file_counter, | ||
:size, | ||
:content, | ||
:is_downloaded, | ||
:is_decrypted, | ||
:download_error_id, | ||
:last_updated | ||
) | ||
""" | ||
session.execute(text(sql), params) |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters