CCRI-POPROX · karlhigley · Sep 6, 2024 · Sep 3, 2024 · Sep 3, 2024 · Sep 3, 2024
diff --git a/...igrations/versions/2024_09_04_1125-8bf414e0ddfb_remove_name_column_from_datasets_table.py b/...igrations/versions/2024_09_04_1125-8bf414e0ddfb_remove_name_column_from_datasets_table.py
@@ -0,0 +1,29 @@
+"""remove name column from datasets table
+
+Revision ID: 8bf414e0ddfb
+Revises: dd50d8e7777e
+Create Date: 2024-09-04 11:25:43.062068
+
+"""
+
+from typing import Sequence, Union
+
+import sqlalchemy as sa
+from alembic import op
+
+# revision identifiers, used by Alembic.
+revision: str = "8bf414e0ddfb"
+down_revision: Union[str, None] = "dd50d8e7777e"
+branch_labels: Union[str, Sequence[str], None] = None
+depends_on: Union[str, Sequence[str], None] = None
+
+
+def upgrade() -> None:
+    """Drop the ``dataset_name`` column from the ``datasets`` table."""
+    op.drop_column(table_name="datasets", column_name="dataset_name")
+
+
+def downgrade() -> None:
+    """Re-create the ``dataset_name`` string column on the ``datasets`` table.
+
+    Only the column itself is added back; this migration does not backfill
+    any values into it.
+    """
+    restored_column = sa.Column("dataset_name", sa.String)
+    op.add_column("datasets", restored_column)
diff --git a/src/poprox_storage/concepts/experiment.py b/src/poprox_storage/concepts/experiment.py
@@ -6,8 +6,15 @@
 from pydantic import BaseModel, PositiveInt
 
 
+class Team(BaseModel):
+    """A named team with a list of member UUIDs; used as the owner of an ``Experiment``."""
+
+    # Optional identifier; defaults to None when not supplied.
+    team_id: UUID | None = None
+    # Required team name.
+    team_name: str
+    # UUIDs of the team's members -- presumably account IDs; TODO confirm against callers.
+    members: list[UUID]
+
+
 class Experiment(BaseModel):
     experiment_id: UUID | None = None
+    owner: Team
     description: str
     start_date: date
     end_date: date

diff --git a/src/poprox_storage/concepts/manifest.py b/src/poprox_storage/concepts/manifest.py
@@ -2,15 +2,17 @@
 
 from copy import deepcopy
 from datetime import date, timedelta
-from uuid import UUID
+from uuid import UUID, uuid4
 
+import tomli
 from pydantic import BaseModel, PositiveInt
 
 from poprox_storage.concepts.experiment import (
     Experiment,
     Group,
     Phase,
     Recommender,
+    Team,
     Treatment,
 )
 
@@ -22,6 +24,7 @@ class ManifestFile(BaseModel):
     """
 
     experiment: ManifestExperiment
+    owner: ManifestTeam
     users: ManifestGroupSpec
     recommenders: dict[str, ManifestRecommender]
     phases: ManifestPhases
@@ -34,6 +37,12 @@ class ManifestExperiment(BaseModel):
     start_date: date | None = None
 
 
+class ManifestTeam(BaseModel):
+    """Team description as it appears in the ``owner`` field of a ``ManifestFile``.
+
+    ``manifest_to_experiment`` copies these three fields into a ``Team``.
+    """
+
+    # Required here (no default), unlike the optional ``Team.team_id``.
+    team_id: UUID
+    # Required team name.
+    team_name: str
+    # UUIDs of the team's members -- presumably account IDs; TODO confirm against callers.
+    members: list[UUID]
+
+
 class ManifestPhases(BaseModel):
     sequence: list[str]
     phases: dict[str, ManifestPhase]
@@ -85,34 +94,43 @@ def manifest_to_experiment(manifest: ManifestFile) -> Experiment:
     start_date = manifest.experiment.start_date or (date.today() + timedelta(days=1))  # noqa: DTZ011
     end_date = start_date + convert_duration(manifest.experiment.duration)
 
+    owner = Team(
+        team_id=manifest.owner.team_id,
+        team_name=manifest.owner.team_name,
+        members=manifest.owner.members,
+    )
+
     experiment = Experiment(
+        experiment_id=manifest.experiment.id,
+        owner=owner,
         start_date=start_date,
         end_date=end_date,
         description=manifest.experiment.description,
         phases=[],
     )
 
     recommenders = {
-        rec_name: Recommender(name=rec_name, endpoint_url=recommender.endpoint)
+        rec_name: Recommender(recommender_id=uuid4(), name=rec_name, endpoint_url=recommender.endpoint)
         for rec_name, recommender in manifest.recommenders.items()
     }
 
     groups = {}
     for group_name, group in manifest.users.groups.items():
         if group.identical_to:
             new_group = deepcopy(groups[group.identical_to])
+            new_group.group_id = uuid4()
             new_group.name = group_name
             groups[group_name] = new_group
         else:
-            groups[group_name] = Group(name=group_name, minimum_size=group.minimum_size)
+            groups[group_name] = Group(group_id=uuid4(), name=group_name, minimum_size=group.minimum_size)
 
     phase_start = start_date
     for phase_name in manifest.phases.sequence:
         manifest_phase = manifest.phases.phases[phase_name]
         duration = convert_duration(manifest_phase.duration)
         phase_start = start_date + sum([phase.duration for phase in experiment.phases], start=timedelta(0))
         phase_end = phase_start + duration
-        phase = Phase(name=phase_name, start_date=phase_start, end_date=phase_end, treatments=[])
+        phase = Phase(phase_id=uuid4(), name=phase_name, start_date=phase_start, end_date=phase_end, treatments=[])
         for group_name, assignment in manifest_phase.assignments.items():
             recommender_name = assignment.recommender
             phase.treatments.append(
@@ -137,3 +155,15 @@ def convert_duration(duration: str) -> timedelta:
             msg = f"Unsupported duration unit: {unit}"
             raise ValueError(msg)
     return duration
+
+
+def parse_manifest_toml(manifest_file: str):
+    """Parse the TOML text of an experiment manifest into a ``ManifestFile``.
+
+    In the TOML document the ``phases`` table holds the ``sequence`` list
+    side by side with one sub-table per phase.  ``ManifestPhases`` expects
+    them separated, so the table is reshaped into
+    ``{"sequence": [...], "phases": {name: phase, ...}}`` before validation.
+
+    Args:
+        manifest_file:
+            The manifest *contents* as a TOML string (not a path).
+
+    Returns:
+        The validated ``ManifestFile`` model.
+
+    Raises:
+        KeyError: If the document has no ``phases`` table or that table has
+            no ``sequence`` entry.
+    """
+    document = tomli.loads(manifest_file)
+    phase_table = document["phases"]
+
+    # Everything in the table other than "sequence" is a phase definition.
+    document["phases"] = {
+        "sequence": phase_table["sequence"],
+        "phases": {key: value for key, value in phase_table.items() if key != "sequence"},
+    }
+
+    return ManifestFile.model_validate(document)
diff --git a/src/poprox_storage/paths.py b/src/poprox_storage/paths.py
@@ -0,0 +1,61 @@
+# pyright: strict
+from __future__ import annotations
+
+import logging
+from pathlib import Path
+from typing import overload
+
+logger = logging.getLogger(__name__)
+_cached_root: Path | None = None
+
+
+@overload
+def project_root() -> Path: ...
+@overload
+def project_root(*, require: bool) -> Path | None: ...
+def project_root(*, require: bool = True) -> Path | None:
+    """
+    Find the project root directory (when we are running in the project).
+
+    This searches upwards from the **current working directory** for the
+    nearest directory containing a ``pyproject.toml`` file and treats that
+    directory as the project root.  Only the existence of the file is
+    checked; its contents are not read or validated.
+
+    A successful lookup is cached for the lifetime of the process, so later
+    calls return the same path even if the working directory changes.
+
+    Args:
+        require:
+            Whether to fail when the project root is not found, or return
+            ``None``.
+
+    Returns:
+        The full path to the project root directory.  If the project root is
+        not found and ``require=False``, returns ``None``.
+
+    Raises:
+        RuntimeError:
+            If no project root is found and ``require`` is true.
+    """
+    global _cached_root
+    if _cached_root is not None:
+        return _cached_root
+
+    cwd = Path(".").resolve()
+    candidate = cwd
+    logger.debug("searching for project root upwards from %s", candidate)
+    while not _is_project_root(candidate):
+        parent = candidate.parent
+        # The filesystem root is its own parent on every platform ("/" on
+        # POSIX, a drive or UNC anchor on Windows), so this is a portable
+        # stop condition; comparing against "/" would loop forever on Windows.
+        if parent == candidate:
+            if require:
+                msg = f"cannot find project root for {cwd}"
+                raise RuntimeError(msg)
+            # don't cache None, so a later call from another directory can succeed
+            return None
+        candidate = parent
+
+    logger.debug("found project root at  %s", candidate)
+    _cached_root = candidate
+    return candidate
+
+
+def _is_project_root(path: Path) -> bool:
+    """Return whether ``path`` contains a ``pyproject.toml`` entry."""
+    return (path / "pyproject.toml").exists()
diff --git a/src/poprox_storage/repositories/accounts.py b/src/poprox_storage/repositories/accounts.py
@@ -55,6 +55,21 @@ def fetch_account_by_email(self, email: str) -> Account | None:
             return accounts[0]
         return None
 
+    def store_account(self, account: Account) -> UUID | None:
+        """Insert ``account`` as a new row in the ``accounts`` table.
+
+        The row is written with the account's own ``account_id``, ``email``
+        and ``source``; ``status`` is always set to ``"new_account"``.
+
+        Args:
+            account: The account to persist.
+
+        Returns:
+            The ``account_id`` reported by the ``RETURNING`` clause, or
+            ``None`` if the statement produced no row.
+        """
+        account_tbl = self.tables["accounts"]
+        query = (
+            sqlalchemy.insert(account_tbl)
+            .values(
+                account_id=account.account_id,
+                email=account.email,
+                source=account.source,
+                status="new_account",
+            )
+            .returning(account_tbl.c.account_id)
+        )
+        row = self.conn.execute(query).one_or_none()
+        # one_or_none() yields None when no row comes back; honour the declared
+        # ``UUID | None`` return instead of failing with AttributeError.
+        if row is None:
+            return None
+        return row.account_id
+
     def store_new_account(self, email: str, source: str) -> Account:
         account_tbl = self.tables["accounts"]
         query = (