Skip to content

Commit

Permalink
Use special "deleted" journalist for associations with deleted users
Browse files Browse the repository at this point in the history
Currently when a journalist is deleted, most referential tables are
updated with `journalist_id=NULL`, forcing all clients to accomodate
that case. Instead, we are now going to either re-associate those rows
with a special "deleted" journalist account, or delete them outright.
All journalist_id columns are now NOT NULL to enforce this.

Tables with rows migrated to "deleted":
* replies
* seen_files
* seen_messages
* seen_replies

Tables with rows that are deleted outright:
* journalist_login_attempt
* revoked_tokens

The "deleted" journalist account is a real account that exists in the
database, but cannot be logged into and has no passphase set. It is not
possible to delete it nor is it shown in the admin listing of
journalists. It is lazily created on demand using a special
DeletedJournalist subclass that bypasses username and passphrase
validation.

Journalist objects must now be deleted by calling the new delete()
function on them. Trying to directly `db.session.delete(journalist)`
will most likely fail with an Exception because of rows that weren't
migrated first.

The migration step looks for any existing rows in those tables with
journalist_id=NULL and either migrates them to "deleted" or deletes
them. Then all the columns are changed to be NOT NULL.

Fixes #6192.
  • Loading branch information
legoktm committed Jan 14, 2022
1 parent 4f6259f commit 312106a
Show file tree
Hide file tree
Showing 8 changed files with 380 additions and 28 deletions.
Original file line number Diff line number Diff line change
@@ -0,0 +1,128 @@
"""make journalist_id non-nullable
Revision ID: 2e24fc7536e8
Revises: de00920916bf
Create Date: 2022-01-12 19:31:06.186285
"""
import uuid

from alembic import op
import sqlalchemy as sa

# revision identifiers, used by Alembic.
revision = '2e24fc7536e8'
down_revision = 'de00920916bf'
branch_labels = None
depends_on = None


def create_deleted() -> int:
"""manually insert a "deleted" journalist user.
We need to do it this way since the model will reflect the current state of
the schema, not what it is at the current migration step
It should be basically identical to what DeletedJournalist.get() does
"""
op.execute(sa.text(
"""\
INSERT INTO journalists (uuid, username, session_nonce)
VALUES (:uuid, "deleted", 0);
"""
).bindparams(uuid=str(uuid.uuid4())))
# Get the autoincrement ID back
conn = op.get_bind()
result = conn.execute('SELECT id FROM journalists WHERE username="deleted";').fetchall()
return result[0][0]


def migrate_nulls():
"""migrate existing journalist_id=NULL over to deleted or delete them"""
op.execute("DELETE FROM journalist_login_attempt WHERE journalist_id IS NULL;")
op.execute("DELETE FROM revoked_tokens WHERE journalist_id IS NULL;")
# Look to see if we have data to migrate
tables = ('replies', 'seen_files', 'seen_messages', 'seen_replies')
needs_migration = []
conn = op.get_bind()
for table in tables:
result = conn.execute(f'SELECT 1 FROM {table} WHERE journalist_id IS NULL;').first() # nosec
if result is not None:
needs_migration.append(table)

if not needs_migration:
return

deleted_id = create_deleted()
for table in needs_migration:
op.execute(sa.text(
f'UPDATE {table} SET journalist_id=:journalist_id WHERE journalist_id IS NULL;'
).bindparams(journalist_id=deleted_id))


def upgrade():
migrate_nulls()

with op.batch_alter_table('journalist_login_attempt', schema=None) as batch_op:
batch_op.alter_column('journalist_id',
existing_type=sa.INTEGER(),
nullable=False)

with op.batch_alter_table('replies', schema=None) as batch_op:
batch_op.alter_column('journalist_id',
existing_type=sa.INTEGER(),
nullable=False)

with op.batch_alter_table('revoked_tokens', schema=None) as batch_op:
batch_op.alter_column('journalist_id',
existing_type=sa.INTEGER(),
nullable=False)

with op.batch_alter_table('seen_files', schema=None) as batch_op:
batch_op.alter_column('journalist_id',
existing_type=sa.INTEGER(),
nullable=False)

with op.batch_alter_table('seen_messages', schema=None) as batch_op:
batch_op.alter_column('journalist_id',
existing_type=sa.INTEGER(),
nullable=False)

with op.batch_alter_table('seen_replies', schema=None) as batch_op:
batch_op.alter_column('journalist_id',
existing_type=sa.INTEGER(),
nullable=False)


def downgrade():
# We do not un-migrate the data back to journalist_id=NULL

with op.batch_alter_table('seen_replies', schema=None) as batch_op:
batch_op.alter_column('journalist_id',
existing_type=sa.INTEGER(),
nullable=True)

with op.batch_alter_table('seen_messages', schema=None) as batch_op:
batch_op.alter_column('journalist_id',
existing_type=sa.INTEGER(),
nullable=True)

with op.batch_alter_table('seen_files', schema=None) as batch_op:
batch_op.alter_column('journalist_id',
existing_type=sa.INTEGER(),
nullable=True)

with op.batch_alter_table('revoked_tokens', schema=None) as batch_op:
batch_op.alter_column('journalist_id',
existing_type=sa.INTEGER(),
nullable=True)

with op.batch_alter_table('replies', schema=None) as batch_op:
batch_op.alter_column('journalist_id',
existing_type=sa.INTEGER(),
nullable=True)

with op.batch_alter_table('journalist_login_attempt', schema=None) as batch_op:
batch_op.alter_column('journalist_id',
existing_type=sa.INTEGER(),
nullable=True)
20 changes: 13 additions & 7 deletions securedrop/journalist_app/admin.py
Original file line number Diff line number Diff line change
Expand Up @@ -30,7 +30,7 @@ def make_blueprint(config: SDConfig) -> Blueprint:
@view.route('/', methods=('GET', 'POST'))
@admin_required
def index() -> str:
users = Journalist.query.all()
users = Journalist.query.filter(Journalist.username != "deleted").all()
return render_template("admin.html", users=users)

@view.route('/config', methods=('GET', 'POST'))
Expand Down Expand Up @@ -288,16 +288,22 @@ def delete_user(user_id: int) -> werkzeug.Response:
current_app.logger.error(
"Admin {} tried to delete itself".format(g.user.username))
abort(403)
elif user:
db.session.delete(user)
db.session.commit()
flash(gettext("Deleted user '{user}'.").format(
user=user.username), "notification")
else:
elif not user:
current_app.logger.error(
"Admin {} tried to delete nonexistent user with pk={}".format(
g.user.username, user_id))
abort(404)
elif user.username == "deleted":
# Do not flash because the interface does not expose this.
# It can only happen by manually crafting a POST request
current_app.logger.error(
"Admin {} tried to delete \"deleted\" user".format(g.user.username))
abort(403)
else:
user.delete()
db.session.commit()
flash(gettext("Deleted user '{user}'.").format(
user=user.username), "notification")

return redirect(url_for('admin.index'))

Expand Down
2 changes: 1 addition & 1 deletion securedrop/loaddata.py
Original file line number Diff line number Diff line change
Expand Up @@ -382,7 +382,7 @@ def load(args: argparse.Namespace) -> None:

# delete one journalist
_, _, journalist_to_be_deleted = journalists
db.session.delete(journalist_to_be_deleted)
journalist_to_be_deleted.delete()
db.session.commit()


Expand Down
84 changes: 67 additions & 17 deletions securedrop/models.py
Original file line number Diff line number Diff line change
Expand Up @@ -2,6 +2,7 @@
import binascii
import datetime
import base64
import itertools
import os
import pyotp
import qrcode
Expand Down Expand Up @@ -254,7 +255,7 @@ class Reply(db.Model):
id = Column(Integer, primary_key=True)
uuid = Column(String(36), unique=True, nullable=False)

journalist_id = Column(Integer, ForeignKey('journalists.id'))
journalist_id = Column(Integer, ForeignKey('journalists.id'), nullable=False)
journalist = relationship(
"Journalist",
backref=backref(
Expand Down Expand Up @@ -294,18 +295,16 @@ def __repr__(self) -> str:
return '<Reply %r>' % (self.filename)

def to_json(self) -> 'Dict[str, Any]':
journalist_username = "deleted"
journalist_first_name = ""
journalist_last_name = ""
journalist_uuid = "deleted"
if self.journalist:
journalist_username = self.journalist.username
journalist_first_name = self.journalist.first_name
journalist_last_name = self.journalist.last_name
journalist_username = self.journalist.username
journalist_first_name = self.journalist.first_name or ""
journalist_last_name = self.journalist.last_name or ""
if journalist_username == "deleted":
# special-case the "deleted" user
journalist_uuid = "deleted"
else:
journalist_uuid = self.journalist.uuid
seen_by = [
r.journalist.uuid for r in SeenReply.query.filter(SeenReply.reply_id == self.id)
if r.journalist
]
json_reply = {
'source_url': url_for('api.single_source',
Expand Down Expand Up @@ -434,10 +433,17 @@ class Journalist(db.Model):
) # type: Column[Optional[datetime.datetime]]
last_access = Column(DateTime) # type: Column[Optional[datetime.datetime]]
passphrase_hash = Column(String(256)) # type: Column[Optional[str]]

login_attempts = relationship(
"JournalistLoginAttempt",
backref="journalist"
backref="journalist",
cascade="all, delete"
) # type: RelationshipProperty[JournalistLoginAttempt]
revoked_tokens = relationship(
"RevokedToken",
backref="journalist",
cascade="all, delete"
) # type: RelationshipProperty[RevokedToken]

MIN_USERNAME_LEN = 3
MIN_NAME_LEN = 0
Expand All @@ -446,7 +452,7 @@ class Journalist(db.Model):

def __init__(self,
username: str,
password: str,
password: 'Optional[str]',
first_name: 'Optional[str]' = None,
last_name: 'Optional[str]' = None,
is_admin: bool = False,
Expand Down Expand Up @@ -784,13 +790,57 @@ def to_json(self, all_info: bool = True) -> Dict[str, Any]:

return json_user

def delete(self) -> None:
"""delete a journalist, migrating some data over to the "deleted" journalist
Callers must commit the session themselves
"""
deleted = DeletedJournalist.get()
# All the rows that should be reassociated with the "deleted" journalist
reassociate = itertools.chain(
Reply.query.filter_by(journalist_id=self.id).all(),
SeenFile.query.filter_by(journalist_id=self.id).all(),
SeenMessage.query.filter_by(journalist_id=self.id).all(),
SeenReply.query.filter_by(journalist_id=self.id).all()
)
for obj in reassociate:
obj.journalist_id = deleted.id
db.session.add(obj)

# For the rest of the associated data we rely on cascading deletions
db.session.delete(self)


class DeletedJournalist(Journalist):
"""A system user that represents deleted journalists for referential integrity"""
def __init__(self) -> None:
super().__init__(username='deleted', password=None)

@staticmethod
def get() -> 'Journalist':
deleted = Journalist.query.filter_by(username='deleted').one_or_none()
if deleted is None:
# Lazily create
deleted = DeletedJournalist()
db.session.add(deleted)
return deleted

@classmethod
def check_username_acceptable(cls, username: str) -> None:
"""override parent to disable this check"""
return None

def set_password(self, passphrase: 'Optional[str]') -> None:
"""override parent to disable this, we set no password"""
return None


class SeenFile(db.Model):
__tablename__ = "seen_files"
__table_args__ = (db.UniqueConstraint("file_id", "journalist_id"),)
id = Column(Integer, primary_key=True)
file_id = Column(Integer, ForeignKey("submissions.id"), nullable=False)
journalist_id = Column(Integer, ForeignKey("journalists.id"), nullable=True)
journalist_id = Column(Integer, ForeignKey("journalists.id"), nullable=False)
file = relationship(
"Submission", backref=backref("seen_files", lazy="dynamic", cascade="all,delete")
) # type: RelationshipProperty[Submission]
Expand All @@ -804,7 +854,7 @@ class SeenMessage(db.Model):
__table_args__ = (db.UniqueConstraint("message_id", "journalist_id"),)
id = Column(Integer, primary_key=True)
message_id = Column(Integer, ForeignKey("submissions.id"), nullable=False)
journalist_id = Column(Integer, ForeignKey("journalists.id"), nullable=True)
journalist_id = Column(Integer, ForeignKey("journalists.id"), nullable=False)
message = relationship(
"Submission", backref=backref("seen_messages", lazy="dynamic", cascade="all,delete")
) # type: RelationshipProperty[Submission]
Expand All @@ -818,7 +868,7 @@ class SeenReply(db.Model):
__table_args__ = (db.UniqueConstraint("reply_id", "journalist_id"),)
id = Column(Integer, primary_key=True)
reply_id = Column(Integer, ForeignKey("replies.id"), nullable=False)
journalist_id = Column(Integer, ForeignKey("journalists.id"), nullable=True)
journalist_id = Column(Integer, ForeignKey("journalists.id"), nullable=False)
reply = relationship(
"Reply", backref=backref("seen_replies", cascade="all,delete")
) # type: RelationshipProperty[Reply]
Expand All @@ -838,7 +888,7 @@ class JournalistLoginAttempt(db.Model):
DateTime,
default=datetime.datetime.utcnow
) # type: Column[Optional[datetime.datetime]]
journalist_id = Column(Integer, ForeignKey('journalists.id'))
journalist_id = Column(Integer, ForeignKey('journalists.id'), nullable=False)

def __init__(self, journalist: Journalist) -> None:
self.journalist = journalist
Expand All @@ -853,7 +903,7 @@ class RevokedToken(db.Model):
__tablename__ = 'revoked_tokens'

id = Column(Integer, primary_key=True)
journalist_id = Column(Integer, ForeignKey('journalists.id'))
journalist_id = Column(Integer, ForeignKey('journalists.id'), nullable=False)
token = db.Column(db.Text, nullable=False, unique=True)


Expand Down
Loading

0 comments on commit 312106a

Please sign in to comment.