feat: log presence, read receipts, group leaves, links, profiles, stories

This commit is contained in:
h
2026-05-29 22:13:59 +02:00
parent bfd16ab02c
commit bcb94b6474
31 changed files with 1298 additions and 19 deletions
@@ -0,0 +1,155 @@
"""phase8 profiles groups stories links
Revision ID: a1d4f7c2e9b8
Revises: f3a8d1c5b7e2
Create Date: 2026-05-29 22:10:00.000000
"""
from collections.abc import Sequence
import sqlalchemy as sa
from alembic import op
from sqlalchemy.dialects import postgresql
# Alembic revision identifiers: this migration's own id and the parent
# revision it is applied on top of ("Revises" in the module docstring).
revision: str = "a1d4f7c2e9b8"
down_revision: str | None = "f3a8d1c5b7e2"
# No branch labels or cross-branch dependencies are declared.
branch_labels: str | Sequence[str] | None = None
depends_on: str | Sequence[str] | None = None
def upgrade() -> None:
    """Create the phase-8 tables.

    Tables are created in this order: ``peers``, ``peer_history``,
    ``avatars``, ``chat_history``, ``memberships``, ``stories`` and
    ``links``.  Every table has a non-null ``account_id`` column and a
    non-null JSONB ``raw`` column; no foreign keys are declared.
    """

    # Column factories.  Each call builds a fresh ``sa.Column`` because a
    # Column object can only be attached to a single table.
    def integer(name: str, *, nullable: bool = False) -> sa.Column:
        return sa.Column(name, sa.Integer(), nullable=nullable)

    def bigint(name: str, *, nullable: bool = False) -> sa.Column:
        return sa.Column(name, sa.BigInteger(), nullable=nullable)

    def string(name: str, *, nullable: bool = True) -> sa.Column:
        return sa.Column(name, sa.String(), nullable=nullable)

    def flag(name: str) -> sa.Column:
        # Boolean flags are always NOT NULL and have no server default.
        return sa.Column(name, sa.Boolean(), nullable=False)

    def timestamp(
        name: str, *, nullable: bool = False, default_now: bool = False
    ) -> sa.Column:
        # Timezone-aware timestamp; optionally defaulted to now() by the server.
        extra = {"server_default": sa.text("now()")} if default_now else {}
        return sa.Column(
            name, sa.DateTime(timezone=True), nullable=nullable, **extra
        )

    def account() -> sa.Column:
        return integer("account_id")

    def raw_payload() -> sa.Column:
        return sa.Column(
            "raw", postgresql.JSONB(astext_type=sa.Text()), nullable=False
        )

    def profile_columns() -> list[sa.Column]:
        # Column run shared verbatim by ``peers`` and ``peer_history``.
        return [
            string("first_name"),
            string("last_name"),
            string("username"),
            string("phone"),
            string("photo_unique_id"),
            flag("is_deleted_account"),
            raw_payload(),
        ]

    # peers: one row per (account_id, peer_id).
    op.create_table(
        "peers",
        account(),
        bigint("peer_id"),
        *profile_columns(),
        timestamp("updated_at", default_now=True),
        sa.PrimaryKeyConstraint("account_id", "peer_id"),
    )

    # peer_history: same profile columns, additionally keyed by observed_at.
    op.create_table(
        "peer_history",
        account(),
        bigint("peer_id"),
        timestamp("observed_at"),
        *profile_columns(),
        sa.PrimaryKeyConstraint("account_id", "peer_id", "observed_at"),
    )

    # avatars: surrogate id, unique per (account_id, owner_id, unique_id).
    op.create_table(
        "avatars",
        sa.Column("id", sa.BigInteger(), autoincrement=True, nullable=False),
        account(),
        bigint("owner_id"),
        string("owner_kind", nullable=False),
        string("unique_id", nullable=False),
        string("storage_key"),
        bigint("file_size", nullable=True),
        string("mime"),
        flag("downloaded"),
        raw_payload(),
        timestamp("first_seen_at", default_now=True),
        sa.PrimaryKeyConstraint("id"),
        sa.UniqueConstraint("account_id", "owner_id", "unique_id"),
    )

    # chat_history: one row per (account_id, chat_id, message_id).
    op.create_table(
        "chat_history",
        account(),
        bigint("chat_id"),
        bigint("message_id"),
        string("event", nullable=False),
        string("title"),
        string("photo_unique_id"),
        bigint("actor_id", nullable=True),
        timestamp("ts"),
        raw_payload(),
        sa.PrimaryKeyConstraint("account_id", "chat_id", "message_id"),
    )

    # memberships: like chat_history but additionally keyed by user_id.
    op.create_table(
        "memberships",
        account(),
        bigint("chat_id"),
        bigint("message_id"),
        bigint("user_id"),
        string("event", nullable=False),
        bigint("actor_id", nullable=True),
        timestamp("ts"),
        raw_payload(),
        sa.PrimaryKeyConstraint(
            "account_id", "chat_id", "message_id", "user_id"
        ),
    )

    # stories: one row per (account_id, peer_id, story_id).
    op.create_table(
        "stories",
        account(),
        bigint("peer_id"),
        bigint("story_id"),
        timestamp("date", nullable=True),
        timestamp("expire_date", nullable=True),
        string("caption"),
        string("media_kind"),
        string("storage_key"),
        bigint("file_size", nullable=True),
        flag("downloaded"),
        integer("views", nullable=True),
        flag("pinned"),
        flag("deleted"),
        raw_payload(),
        timestamp("observed_at", default_now=True),
        sa.PrimaryKeyConstraint("account_id", "peer_id", "story_id"),
    )

    # links: keyed by message plus the link's position.
    op.create_table(
        "links",
        account(),
        bigint("chat_id"),
        bigint("message_id"),
        integer("position"),
        string("url", nullable=False),
        string("kind", nullable=False),
        string("web_url"),
        string("web_title"),
        string("web_description"),
        string("web_site_name"),
        raw_payload(),
        sa.PrimaryKeyConstraint(
            "account_id", "chat_id", "message_id", "position"
        ),
    )
def downgrade() -> None:
    """Drop every table created by ``upgrade()``.

    Tables are dropped in the reverse of the order ``upgrade()`` creates them.
    """
    tables_in_drop_order = (
        "links",
        "stories",
        "memberships",
        "chat_history",
        "avatars",
        "peer_history",
        "peers",
    )
    for table_name in tables_in_drop_order:
        op.drop_table(table_name)
@@ -0,0 +1,67 @@
"""presence hypertable
Revision ID: e5c1f0a72b9d
Revises: d4b9f2e6a1c7
Create Date: 2026-05-29 21:00:00.000000
"""
from collections.abc import Sequence
import sqlalchemy as sa
from alembic import op
from sqlalchemy.dialects import postgresql
# Alembic revision identifiers: this migration's own id and the parent
# revision it is applied on top of ("Revises" in the module docstring).
revision: str = "e5c1f0a72b9d"
down_revision: str | None = "d4b9f2e6a1c7"
# No branch labels or cross-branch dependencies are declared.
branch_labels: str | Sequence[str] | None = None
depends_on: str | Sequence[str] | None = None
def upgrade() -> None:
    """Create the ``presence`` hypertable and its hourly rollup.

    Steps, in order:

    1. create the plain ``presence`` table;
    2. convert it into a TimescaleDB hypertable partitioned on ``ts``
       with a one-week interval;
    3. enable the columnstore (segmented by ``peer_id``, ordered by
       ``ts DESC``) and add a columnstore policy with ``after`` set to
       30 days;
    4. create the ``presence_hourly`` continuous aggregate without
       populating it, and register its refresh policy.
    """
    # ``ts`` is part of the primary key; TimescaleDB requires unique
    # constraints on a hypertable to include the partitioning column.
    presence_columns = [
        sa.Column("account_id", sa.Integer(), nullable=False),
        sa.Column("peer_id", sa.BigInteger(), nullable=False),
        sa.Column("ts", sa.DateTime(timezone=True), nullable=False),
        sa.Column("status", sa.String(), nullable=False),
        sa.Column("last_online_date", sa.DateTime(timezone=True), nullable=True),
        sa.Column("next_offline_date", sa.DateTime(timezone=True), nullable=True),
        sa.Column("raw", postgresql.JSONB(astext_type=sa.Text()), nullable=False),
    ]
    op.create_table(
        "presence",
        *presence_columns,
        sa.PrimaryKeyConstraint("account_id", "peer_id", "ts"),
    )

    make_hypertable = (
        "SELECT create_hypertable('presence', by_range('ts', INTERVAL '1 week'))"
    )

    columnstore_options = ", ".join(
        [
            "timescaledb.enable_columnstore = true",
            "timescaledb.segmentby = 'peer_id'",
            "timescaledb.orderby = 'ts DESC'",
        ]
    )
    enable_columnstore = "ALTER TABLE presence SET (" + columnstore_options + ")"

    columnstore_policy = (
        "CALL add_columnstore_policy('presence', after => INTERVAL '30 days')"
    )

    # Hourly buckets per (account_id, peer_id): total samples, samples
    # whose status is 'online', and the latest ts seen in the bucket.
    create_hourly_view = " ".join(
        [
            "CREATE MATERIALIZED VIEW presence_hourly",
            "WITH (timescaledb.continuous) AS",
            "SELECT time_bucket('1 hour', ts) AS bucket,",
            "account_id, peer_id,",
            "count(*) AS samples,",
            "count(*) FILTER (WHERE status = 'online') AS online_samples,",
            "max(ts) AS last_seen",
            "FROM presence",
            "GROUP BY bucket, account_id, peer_id",
            "WITH NO DATA",
        ]
    )

    hourly_refresh_policy = " ".join(
        [
            "SELECT add_continuous_aggregate_policy('presence_hourly',",
            "start_offset => INTERVAL '3 hours',",
            "end_offset => INTERVAL '1 hour',",
            "schedule_interval => INTERVAL '1 hour')",
        ]
    )

    # Order matters: the table must be a hypertable before the columnstore
    # and the continuous aggregate can be configured on it.
    for statement in (
        make_hypertable,
        enable_columnstore,
        columnstore_policy,
        create_hourly_view,
        hourly_refresh_policy,
    ):
        op.execute(statement)
def downgrade() -> None:
    """Drop the ``presence_hourly`` view (if present), then ``presence``."""
    # The view is defined over ``presence``, so it is removed first.
    drop_hourly_view = "DROP MATERIALIZED VIEW IF EXISTS presence_hourly"
    op.execute(drop_hourly_view)

    presence_table = "presence"
    op.drop_table(presence_table)
@@ -0,0 +1,49 @@
"""read_receipts hypertable
Revision ID: f3a8d1c5b7e2
Revises: e5c1f0a72b9d
Create Date: 2026-05-29 21:30:00.000000
"""
from collections.abc import Sequence
import sqlalchemy as sa
from alembic import op
from sqlalchemy.dialects import postgresql
# Alembic revision identifiers: this migration's own id and the parent
# revision it is applied on top of ("Revises" in the module docstring).
revision: str = "f3a8d1c5b7e2"
down_revision: str | None = "e5c1f0a72b9d"
# No branch labels or cross-branch dependencies are declared.
branch_labels: str | Sequence[str] | None = None
depends_on: str | Sequence[str] | None = None
def upgrade() -> None:
    """Create the ``read_receipts`` hypertable.

    Steps, in order: create the table, convert it into a TimescaleDB
    hypertable partitioned on ``ts`` with a one-week interval, enable the
    columnstore (segmented by ``chat_id``, ordered by ``ts DESC``), and add
    a columnstore policy with ``after`` set to 30 days.
    """
    # NOTE(review): ``reader_id`` is NOT part of the primary key, so two
    # rows with the same (account_id, chat_id, message_id, ts) but different
    # readers would conflict -- confirm this is intended.
    receipt_columns = [
        sa.Column("account_id", sa.Integer(), nullable=False),
        sa.Column("chat_id", sa.BigInteger(), nullable=False),
        sa.Column("reader_id", sa.BigInteger(), nullable=False),
        sa.Column("ts", sa.DateTime(timezone=True), nullable=False),
        sa.Column("kind", sa.String(), nullable=False),
        sa.Column("message_id", sa.BigInteger(), nullable=False),
        sa.Column("raw", postgresql.JSONB(astext_type=sa.Text()), nullable=False),
    ]
    op.create_table(
        "read_receipts",
        *receipt_columns,
        sa.PrimaryKeyConstraint("account_id", "chat_id", "message_id", "ts"),
    )

    make_hypertable = (
        "SELECT create_hypertable('read_receipts', by_range('ts', INTERVAL '1 week'))"
    )

    columnstore_options = ", ".join(
        [
            "timescaledb.enable_columnstore = true",
            "timescaledb.segmentby = 'chat_id'",
            "timescaledb.orderby = 'ts DESC'",
        ]
    )
    enable_columnstore = (
        "ALTER TABLE read_receipts SET (" + columnstore_options + ")"
    )

    columnstore_policy = (
        "CALL add_columnstore_policy('read_receipts', after => INTERVAL '30 days')"
    )

    # The table must be a hypertable before the columnstore is configured.
    for statement in (make_hypertable, enable_columnstore, columnstore_policy):
        op.execute(statement)
def downgrade() -> None:
    """Drop the ``read_receipts`` table created by ``upgrade()``."""
    receipts_table = "read_receipts"
    op.drop_table(receipts_table)