diff --git a/Dockerfile b/Dockerfile index 9d9dcca..c427aa5 100644 --- a/Dockerfile +++ b/Dockerfile @@ -13,6 +13,8 @@ WORKDIR /app COPY requirements.txt . RUN pip install --no-cache-dir -r requirements.txt +ENV PYTHONPATH=/app + COPY backend/ backend/ COPY alembic/ alembic/ COPY alembic.ini . diff --git a/Dockerfile.worker b/Dockerfile.worker index 14d085a..d2c568d 100644 --- a/Dockerfile.worker +++ b/Dockerfile.worker @@ -4,6 +4,8 @@ WORKDIR /app COPY requirements.txt . RUN pip install --no-cache-dir -r requirements.txt +ENV PYTHONPATH=/app + COPY backend/ backend/ COPY alembic/ alembic/ COPY alembic.ini . diff --git a/alembic/versions/001_initial.py b/alembic/versions/001_initial.py new file mode 100644 index 0000000..780e6fa --- /dev/null +++ b/alembic/versions/001_initial.py @@ -0,0 +1,171 @@ +"""initial schema + +Revision ID: 001 +Revises: +Create Date: 2026-03-09 +""" +from alembic import op +import sqlalchemy as sa + +revision = "001" +down_revision = None +branch_labels = None +depends_on = None + + +def upgrade() -> None: + op.create_table( + "monitored_subreddits", + sa.Column("id", sa.Integer(), primary_key=True), + sa.Column("name", sa.String(255), unique=True, nullable=False), + sa.Column("display_name", sa.String(255), nullable=True), + sa.Column("description", sa.String(), nullable=True), + sa.Column("subscribers", sa.Integer(), nullable=True), + sa.Column("is_active", sa.Boolean(), server_default="true", nullable=False), + sa.Column("created_at", sa.DateTime(timezone=True), nullable=False), + sa.Column("updated_at", sa.DateTime(timezone=True), nullable=False), + ) + + op.create_table( + "authors", + sa.Column("id", sa.Integer(), primary_key=True), + sa.Column("username", sa.String(255), unique=True, nullable=False), + sa.Column("first_seen_at", sa.DateTime(timezone=True), nullable=False), + sa.Column("last_seen_at", sa.DateTime(timezone=True), nullable=False), + sa.Column("total_posts", sa.Integer(), server_default="0", nullable=False), + sa.Column("total_comments", sa.Integer(), server_default="0", nullable=False), + ) + + op.create_table( + "posts", + sa.Column("id", sa.Integer(), primary_key=True), + sa.Column("reddit_id", sa.String(20), unique=True, nullable=False), + sa.Column( + "subreddit_id", + sa.Integer(), + sa.ForeignKey("monitored_subreddits.id"), + nullable=False, + index=True, + ), + sa.Column( + "author_id", + sa.Integer(), + sa.ForeignKey("authors.id"), + nullable=True, + index=True, + ), + sa.Column("title", sa.String(), nullable=False), + sa.Column("selftext", sa.String(), nullable=True), + sa.Column("url", sa.String(), nullable=True), + sa.Column("permalink", sa.String(), nullable=True), + sa.Column("flair", sa.String(255), nullable=True), + sa.Column("score", sa.Integer(), server_default="0", nullable=False, index=True), + sa.Column("upvote_ratio", sa.Float(), nullable=True), + sa.Column("num_comments", sa.Integer(), server_default="0", nullable=False), + sa.Column("is_self", sa.Boolean(), nullable=True), + sa.Column("over_18", sa.Boolean(), server_default="false", nullable=False), + sa.Column("hot_rank", sa.Integer(), nullable=True), + sa.Column("created_utc", sa.DateTime(timezone=True), nullable=False), + sa.Column("collected_at", sa.DateTime(timezone=True), nullable=False), + sa.Column("updated_at", sa.DateTime(timezone=True), nullable=False), + ) + op.create_index( + "ix_posts_subreddit_created", "posts", ["subreddit_id", "created_utc"] + ) + + op.create_table( + "comments", + sa.Column("id", sa.Integer(), primary_key=True), + sa.Column("reddit_id", sa.String(20), unique=True, nullable=False), + sa.Column( + "post_id", + sa.Integer(), + sa.ForeignKey("posts.id"), + nullable=False, + index=True, + ), + sa.Column( + "parent_comment_id", + sa.Integer(), + sa.ForeignKey("comments.id"), + nullable=True, + index=True, + ), + sa.Column( + "author_id", + sa.Integer(), + sa.ForeignKey("authors.id"), + nullable=True, + index=True, + ), + sa.Column("body", sa.String(), nullable=False), + sa.Column("score", sa.Integer(), server_default="0", nullable=False), + sa.Column("created_utc", sa.DateTime(timezone=True), nullable=False), + sa.Column("collected_at", sa.DateTime(timezone=True), nullable=False), + sa.Column("updated_at", sa.DateTime(timezone=True), nullable=False), + ) + + op.create_table( + "metric_snapshots", + sa.Column("id", sa.Integer(), primary_key=True), + sa.Column( + "post_id", + sa.Integer(), + sa.ForeignKey("posts.id"), + nullable=False, + ), + sa.Column("score", sa.Integer(), nullable=False), + sa.Column("num_comments", sa.Integer(), nullable=False), + sa.Column("upvote_ratio", sa.Float(), nullable=True), + sa.Column("snapshot_at", sa.DateTime(timezone=True), nullable=False), + ) + op.create_index( + "ix_metric_snapshots_post_snapshot", + "metric_snapshots", + ["post_id", "snapshot_at"], + ) + + op.create_table( + "daily_digests", + sa.Column("id", sa.Integer(), primary_key=True), + sa.Column( + "subreddit_id", + sa.Integer(), + sa.ForeignKey("monitored_subreddits.id"), + nullable=False, + ), + sa.Column("digest_date", sa.Date(), nullable=False), + sa.Column("content", sa.String(), nullable=False), + sa.Column("metadata", sa.JSON(), nullable=True), + sa.Column("generated_at", sa.DateTime(timezone=True), nullable=False), + ) + + op.create_table( + "summaries", + sa.Column("id", sa.Integer(), primary_key=True), + sa.Column( + "subreddit_id", + sa.Integer(), + sa.ForeignKey("monitored_subreddits.id"), + nullable=False, + ), + sa.Column("summary_type", sa.String(50), nullable=False), + sa.Column("content", sa.String(), nullable=True), + sa.Column("metadata", sa.JSON(), nullable=True), + sa.Column("period_start", sa.DateTime(timezone=True), nullable=True), + sa.Column("period_end", sa.DateTime(timezone=True), nullable=True), + sa.Column("provider", sa.String(100), nullable=True), + sa.Column("generated_at", sa.DateTime(timezone=True), nullable=False), + ) + + +def downgrade() -> None: + op.drop_table("summaries") + op.drop_table("daily_digests") + op.drop_index("ix_metric_snapshots_post_snapshot", table_name="metric_snapshots") + op.drop_table("metric_snapshots") + op.drop_table("comments") + op.drop_index("ix_posts_subreddit_created", table_name="posts") + op.drop_table("posts") + op.drop_table("authors") + op.drop_table("monitored_subreddits")