Use sync SQLAlchemy in Celery worker - fixes asyncpg connection issues
Build and push images / build-backend (push) Successful in 1m52s
Build and push images / build-worker (push) Successful in 44s
Build and push images / build-frontend (push) Successful in 25s

This commit is contained in:
2026-06-06 15:29:36 +01:00
parent 29c39c3bbb
commit c4e5eb91ed
3 changed files with 177 additions and 178 deletions
+16 -1
View File
@@ -1,7 +1,9 @@
from sqlalchemy.ext.asyncio import create_async_engine, AsyncSession, async_sessionmaker
from sqlalchemy.orm import DeclarativeBase
from sqlalchemy import create_engine
from sqlalchemy.orm import DeclarativeBase, sessionmaker
from app.core.config import settings
# Async engine for FastAPI
engine = create_async_engine(
settings.database_url,
echo=settings.environment == "development",
@@ -15,6 +17,19 @@ AsyncSessionLocal = async_sessionmaker(
expire_on_commit=False,
)
# Blocking (non-async) engine used by the Celery workers, which do not mix
# well with asyncio. The configured URL names the asyncpg driver, so swap in
# psycopg2: postgresql+asyncpg:// -> postgresql+psycopg2://
sync_url = settings.database_url.replace(
    "postgresql+asyncpg://",
    "postgresql+psycopg2://",
)

sync_engine = create_engine(
    sync_url,
    echo=False,
    pool_size=5,
    max_overflow=10,
    # Test each pooled connection before handing it out.
    pool_pre_ping=True,
)

# Session factory for worker code; loaded attributes are not expired on commit.
SyncSessionLocal = sessionmaker(bind=sync_engine, expire_on_commit=False)
class Base(DeclarativeBase):
    """Declarative base for ORM classes; adds nothing to DeclarativeBase."""
+50 -67
View File
@@ -1,7 +1,10 @@
"""
Background tasks: activity ingestion, route matching, PR calculation.
Uses synchronous SQLAlchemy because Celery's prefork model doesn't play
well with asyncio - each worker process needs its own connection pool,
and async pools don't survive process forks.
"""
import asyncio
from celery import Celery
from app.core.config import settings
@@ -22,23 +25,14 @@ celery_app.conf.update(
)
def run_async(coro):
    """Run an awaitable to completion on a private event loop.

    A fresh loop is created for every call and closed afterwards, so the
    function can be called from synchronous code that has no loop of its own.

    Args:
        coro: The coroutine (or other awaitable accepted by
            ``loop.run_until_complete``) to execute.

    Returns:
        Whatever ``coro`` returns.

    Raises:
        Any exception raised by ``coro`` propagates to the caller.
    """
    loop = asyncio.new_event_loop()
    try:
        return loop.run_until_complete(coro)
    finally:
        try:
            # Finalize async generators that are still suspended; otherwise
            # their ``finally`` / ``async with`` cleanup never runs once the
            # loop is closed.
            loop.run_until_complete(loop.shutdown_asyncgens())
        finally:
            loop.close()
@celery_app.task(bind=True, name="process_activity_file")
def process_activity_file(self, file_path: str, user_id: int, source_type: str):
"""Parse a FIT/GPX file and insert activity + data points into DB."""
from app.services.fit_parser import parse_fit_file, parse_gpx_file, calculate_hr_zones
from app.services.route_matcher import compute_best_splits, routes_are_similar
from app.core.database import AsyncSessionLocal
from app.models.user import Activity, ActivityDataPoint, ActivityLap, PersonalRecord, HealthMetric
from app.core.database import SyncSessionLocal
from app.models.user import Activity, ActivityDataPoint, ActivityLap
from sqlalchemy import select
from datetime import datetime, timezone
from datetime import datetime
self.update_state(state="PROGRESS", meta={"step": "parsing"})
@@ -50,25 +44,22 @@ def process_activity_file(self, file_path: str, user_id: int, source_type: str):
except Exception as e:
raise self.retry(exc=e, countdown=10, max_retries=3)
async def _insert():
async with AsyncSessionLocal() as db:
with SyncSessionLocal() as db:
# Check for duplicate
if parsed.get("garmin_activity_id"):
existing = await db.execute(
existing = db.execute(
select(Activity).where(
Activity.garmin_activity_id == parsed["garmin_activity_id"]
)
)
if existing.scalar_one_or_none():
return None
).scalar_one_or_none()
if existing:
return {"activity_id": existing.id, "status": "duplicate"}
# HR zones
hr_zones = calculate_hr_zones(
parsed.get("data_points", []),
parsed.get("max_heart_rate") or 190
)
# Create activity
start_time = datetime.fromisoformat(parsed["start_time"]) if parsed.get("start_time") else None
activity = Activity(
@@ -97,17 +88,24 @@ def process_activity_file(self, file_path: str, user_id: int, source_type: str):
hr_zones=hr_zones,
)
db.add(activity)
await db.flush()
db.flush()
# Insert data points in batches
# Insert data points in batches - dedupe (activity_id, timestamp) pairs
# since composite PK rejects duplicates and Garmin sometimes has same-second readings
seen = set()
points = parsed.get("data_points", [])
batch_size = 500
for i in range(0, len(points), batch_size):
batch = points[i:i+batch_size]
db.add_all([
ActivityDataPoint(
batch = []
for p in points:
if not p.get("timestamp"):
continue
ts = datetime.fromisoformat(p["timestamp"]) if isinstance(p["timestamp"], str) else p["timestamp"]
key = (activity.id, ts)
if key in seen:
continue
seen.add(key)
batch.append(ActivityDataPoint(
activity_id=activity.id,
timestamp=datetime.fromisoformat(p["timestamp"]) if p.get("timestamp") else None,
timestamp=ts,
latitude=p.get("latitude"),
longitude=p.get("longitude"),
altitude_m=p.get("altitude_m"),
@@ -117,11 +115,16 @@ def process_activity_file(self, file_path: str, user_id: int, source_type: str):
power=p.get("power"),
temperature_c=p.get("temperature_c"),
distance_m=p.get("distance_m"),
)
for p in batch
])
))
if len(batch) >= 500:
db.add_all(batch)
db.flush()
batch = []
if batch:
db.add_all(batch)
db.flush()
# Insert laps
# Laps
for lap in parsed.get("laps", []):
ls = datetime.fromisoformat(lap["start_time"]) if lap.get("start_time") else None
db.add(ActivityLap(
@@ -136,15 +139,11 @@ def process_activity_file(self, file_path: str, user_id: int, source_type: str):
avg_power=lap.get("avg_power"),
))
await db.commit()
return activity.id
db.commit()
activity_id = activity.id
activity_id = run_async(_insert())
if activity_id:
# Queue PR calculation
compute_personal_records.delay(activity_id, user_id, parsed)
return {"activity_id": activity_id, "status": "ok"}
@@ -152,7 +151,7 @@ def process_activity_file(self, file_path: str, user_id: int, source_type: str):
def compute_personal_records(activity_id: int, user_id: int, parsed: dict):
"""Calculate personal records for standard distances from this activity."""
from app.services.route_matcher import compute_best_splits, STANDARD_DISTANCES
from app.core.database import AsyncSessionLocal
from app.core.database import SyncSessionLocal
from app.models.user import PersonalRecord
from sqlalchemy import select
from datetime import datetime, timezone
@@ -165,23 +164,20 @@ def compute_personal_records(activity_id: int, user_id: int, parsed: dict):
best_splits = compute_best_splits(data_points, total_dist)
async def _save():
async with AsyncSessionLocal() as db:
with SyncSessionLocal() as db:
for label, duration_s in best_splits.items():
dist_m = next((d for d, l in STANDARD_DISTANCES if l == label), None)
if dist_m is None:
continue
# Check existing record
existing = await db.execute(
current = db.execute(
select(PersonalRecord).where(
PersonalRecord.user_id == user_id,
PersonalRecord.sport_type == sport,
PersonalRecord.distance_m == dist_m,
PersonalRecord.is_current_record == True,
)
)
current = existing.scalar_one_or_none()
).scalar_one_or_none()
if current is None or duration_s < current.duration_s:
if current:
@@ -196,34 +192,23 @@ def compute_personal_records(activity_id: int, user_id: int, parsed: dict):
achieved_at=start_time,
is_current_record=True,
))
await db.commit()
run_async(_save())
db.commit()
@celery_app.task(name="process_garmin_health_zip")
def process_garmin_health_zip(zip_path: str, user_id: int):
"""
Process a Garmin Connect data export zip.
Extracts wellness/sleep/HRV CSV files and inserts health metrics.
"""
"""Extract wellness/sleep/HRV data from a Garmin Connect export ZIP."""
import zipfile
import json
import csv
from pathlib import Path
from app.core.database import AsyncSessionLocal
from app.core.database import SyncSessionLocal
from app.models.user import HealthMetric
from sqlalchemy.dialects.postgresql import insert
from datetime import datetime, timezone
async def _process():
async with AsyncSessionLocal() as db:
with SyncSessionLocal() as db:
with zipfile.ZipFile(zip_path) as zf:
names = zf.namelist()
# Parse daily summary JSON files from Garmin export
for name in names:
if "DailyMetrics" in name and name.endswith(".json"):
for name in zf.namelist():
if "DailyMetrics" not in name or not name.endswith(".json"):
continue
with zf.open(name) as f:
try:
data = json.load(f)
@@ -252,6 +237,4 @@ def process_garmin_health_zip(zip_path: str, user_id: int):
)
db.add(metric)
await db.commit()
run_async(_process())
db.commit()
+1
View File
@@ -22,3 +22,4 @@ Pillow==10.3.0
aiofiles==23.2.1
python-dateutil==2.9.0
pytz==2024.1
psycopg2-binary==2.9.9