WIP: wrote a query to get domains ordered by number of reported paths

This commit is contained in:
Jack Case
2025-11-24 18:59:22 +00:00
parent a36b6e9865
commit fcc5d9d7bc

View File

@@ -1,7 +1,7 @@
from collections.abc import Iterable
from datetime import datetime
from urllib.parse import ParseResult
from sqlalchemy import select
from sqlalchemy import select, func
from sqlalchemy.engine import Engine
from sqlalchemy.orm import Session
from slopserver.models import Domain, Path, User, Report
@@ -12,6 +12,10 @@ def select_slop(urls: list[ParseResult], engine: Engine) -> Iterable[Domain]:
rows = session.scalars(query).all()
return rows
def top_offenders(limit: int|None = None, engine: Engine) -> Iterable[Domain]:
query = select(Domain).join(Path).group_by(Domain.id).order_by(func.count(Path.id).desc())
top_offenders
def insert_slop(urls: list[ParseResult], engine: Engine, user: User | None = None):
domain_dict: dict[str. set[str]] = dict()
for url in urls: