sciagent code + Gitea Actions CI/CD

Co-Authored-By: Claude Opus 4.8 <noreply@anthropic.com>
2026-06-30 09:38:30 +07:00
commit 688fac73e9
1167 changed files with 158244 additions and 0 deletions
@@ -0,0 +1,23 @@
+# Build context for the frontend_user / frontend_admin images is the repo ROOT (the
+# npm workspace). Keep only root manifests + shared/ + the two app dirs; exclude the
+# rest so the context stays small. (be0 builds from ./be0 and is unaffected by this file.)
+**/node_modules
+**/dist
+**/dist-ssr
+.git
+.gitignore
+.dockerignore
+.claude
+docs
+be0
+fe0
+assets
+database
+Posgresdb
+scripts
+deploy
+*.md
+.env
+.env.*
+.DS_Store
+**/__pycache__
@@ -0,0 +1,105 @@
+# ============================================================
+# Production / docker-compose.prod.yml
+# -----------------------------------------------------------
+# 1. Copy:  cp .env.example .env
+# 2. Fill every value below (never commit .env — it is gitignored).
+# 3. Prefer strong random secrets:
+#       openssl rand -base64 32
+#
+# Before deploy:  ./scripts/verify-prod-env.sh
+# Full deploy:    ./scripts/deploy-prod.sh
+# Stack map (FE→BE→DB→MinIO): docs/deploy-stack-overview.md
+# Postgres / volume quirks: docs/deploy-production-docker.md
+#
+# If .env was ever committed to git, rotate ALL secrets below.
+# ============================================================
+
+# Public hostname or IP that browsers use to reach this machine.
+PUBLIC_HOST=your-public-hostname-or-ip.example.com
+
+FE_PORT=8081
+
+# Optional: admin/council SPA port. Bound to 127.0.0.1 only in docker-compose.prod.yml
+# (reach it via SSH tunnel or an authenticated reverse-proxy vhost). Defaults to 8082.
+# FE_ADMIN_PORT=8082
+
+# Optional: principal-investigator SPA port (research proposals + project cockpit). Defaults to 8083.
+# FE_INV_PORT=8083
+
+# Optional: publisher SPA port (research-result publication). Defaults to 8084.
+# FE_PUB_PORT=8084
+
+# Optional: extra CORS Allowed-Origins for be0 (comma-separated, no spaces). Production compose sets
+# CORS_ORIGINS to http://${PUBLIC_HOST}:${FE_PORT} plus these extras automatically.
+# CORS_ORIGINS_EXTRA=https://app.example.com,http://internal:8081
+
+MINIO_API_PORT=19000
+MINIO_CONSOLE_PORT=19001
+
+MINIO_ROOT_USER=minio_root_change_me
+MINIO_ROOT_PASSWORD=replace_with_long_random_secret
+
+# --- HTTPS for MinIO presigned URLs (required if the SPA is https://…) ------------
+# Mixed content blocks http://PUBLIC_HOST:19000 embedded from an HTTPS UI. Options:
+#   A) Proxied viewer only (already in-app) — no change needed for preview.
+#   B) HTTPS for direct MinIO links (iframe / “open presigned URL”) — put TLS in front
+#      of the S3 API port and align these with that public URL. See docs/minio-behind-https.md .
+# Example subdomain (recommended):
+# S3_PUBLIC_ENDPOINT_URL=https://minio-api.your-domain.com
+# MINIO_SERVER_URL=https://minio-api.your-domain.com
+# Optionally point the console at HTTPS too:
+# MINIO_BROWSER_REDIRECT_URL=https://minio-console.your-domain.com
+# If omitted, Compose keeps using http://${PUBLIC_HOST}:${MINIO_API_PORT} for both.
+
+# Username + password are fixed the first time the Postgres volume is created (see comment below).
+
+# Identifier only (letters, digits, underscore) — avoids URL / healthcheck pitfalls.
+POSTGRES_USER=postgres_app_user
+POSTGRES_PASSWORD=replace_with_long_random_secret
+
+# Optional: only for scripts/sync-postgres-app-password.sh when the app role is not superuser
+# or you must connect as a different DB superuser (e.g. postgres) to run ALTER ROLE.
+# POSTGRES_SUPERUSER=postgres
+
+# Database name created on first init (normally keep "initiatives").
+POSTGRES_DB=initiatives
+
+# --- Auth (required for production) ------------------------------------------------
+# Generate: openssl rand -base64 48
+JWT_SECRET=replace_with_openssl_rand_base64_48
+
+# MinIO browser CORS — your public SPA origin (scheme + host, no trailing slash).
+MINIO_API_CORS_ALLOW_ORIGIN=https://www.example.com
+
+# Postgres + password caveat:
+# Changing POSTGRES_USER/POSTGRES_PASSWORD here later does NOT change an existing Docker volume —
+# Postgres only reads them when /var/lib/postgresql/data is empty. If login fails after editing .env:
+# • Use the same password as first boot (e.g. dev stack used initiative / initiative_secret), or
+# • With docker-compose.prod.yml stopped: docker volume rm …_initiative_pg_data then up again (drops DB), or
+# • Run ./scripts/sync-postgres-app-password.sh to set the DB role password from this file (no wipe).
+
+# ---------------------------------------------------------------------------
+# SMTP — outbound mail from be0 (registration OTP, password reset)
+# ---------------------------------------------------------------------------
+# docker-compose / docker-compose.prod passes these into the be0 container.
+# Compose substitutes ${SMTP_*} from THIS file (repo-root `.env`), not from be0/.env alone.
+# Omit AUTH_MAIL_LOG_ONLY (or set 0/false) when using real SMTP.
+#
+# SMTP_HOST=smtp.your-mail-provider.com
+# SMTP_PORT=587
+# SMTP_USER=your_smtp_username
+# SMTP_PASSWORD=your_smtp_password
+# AUTH_MAIL_FROM=noreply@your-institution.edu.vn
+# SMTP_USE_TLS=1
+#
+# Public URL of the web app (password-reset / verify links in email). Production example:
+# AUTH_PUBLIC_WEB_ORIGIN=https://your-app.example.com
+#
+# Dev-only: print OTP in be0 logs instead of sending mail
+# AUTH_MAIL_LOG_ONLY=1
+#
+# Microsoft 365 / Outlook (smtp.office365.com), log shows 535 Authentication unsuccessful:
+#   • SMTP_USER = full mailbox address; SMTP_PASSWORD = correct app password if MFA is enabled
+#     (not your normal web-login password unless basic auth is allowed — many tenants require app passwords).
+#   • Exchange admin: enable "Authenticated SMTP" for the mailbox; security defaults may block SMTP AUTH.
+#   • After editing .env: docker compose up -d be0 (so the container reloads env).
@@ -0,0 +1,99 @@
+name: CI/CD
+
+# Gitea Actions pipeline for the UMP / ImageHub monorepo.
+#   backend  — be0 (FastAPI, Python 3.11) pytest against a throwaway Postgres
+#   frontend — npm workspaces (shared + 4 Vite/React SPAs): typecheck, build, unit tests
+#   deploy   — on push to main only: build + `docker compose up -d` on the host runner
+#
+# Runner labels expected (act_runner registered on 103.149.170.102):
+#   ci      -> docker mode (clean, ephemeral)   used by backend + frontend
+#   deploy  -> host mode  (drives host docker)  used by deploy
+on:
+  # Pushes to main run the test jobs and, if they pass, the deploy job
+  # (deploy is gated on github.event_name == 'push').
+  push:
+    branches: [main]
+  # Pull requests targeting main run the test jobs only.
+  pull_request:
+    branches: [main]
+
+jobs:
+  # backend — be0 test job: installs requirements-dev.txt on Python 3.11 and
+  # runs pytest against a throwaway Postgres 16 service container.
+  backend:
+    runs-on: ci
+    services:
+      postgres:
+        image: postgres:16-alpine
+        env:
+          POSTGRES_USER: initiative
+          POSTGRES_PASSWORD: initiative_secret
+          POSTGRES_DB: initiatives
+        # No `ports:` mapping on purpose: the job runs in a container, so the
+        # service is reached by its label over the job network (postgres:5432,
+        # see INITIATIVE_DATABASE_URL below). Publishing 5432 on the runner host
+        # would expose this fixed-credential database on the host's interfaces
+        # and fail whenever host port 5432 is already in use.
+        options: >-
+          --health-cmd "pg_isready -U initiative -d initiatives"
+          --health-interval 5s --health-timeout 5s --health-retries 10
+    steps:
+      - uses: actions/checkout@v4
+      - uses: actions/setup-python@v5
+        with:
+          python-version: "3.11"
+      - name: Install backend deps (+ test deps)
+        working-directory: be0
+        run: |
+          python -m pip install --upgrade pip
+          pip install -r requirements-dev.txt
+      - name: Unit tests — pytest PER FILE (isolates asyncpg event loop per module)
+        working-directory: be0
+        env:
+          INITIATIVE_DATABASE_URL: postgresql+asyncpg://initiative:initiative_secret@postgres:5432/initiatives
+        # One pytest process per test file. A failing file only sets fail=1, so
+        # the loop keeps going and every module is reported; the step then exits
+        # non-zero at the end if any file failed.
+        run: |
+          set -e
+          fail=0
+          for f in tests/test_*.py; do
+            echo "::group::$f"
+            python -m pytest "$f" -q || fail=1
+            echo "::endgroup::"
+          done
+          exit $fail
+
+  # frontend — installs the npm workspace once at the repo root on Node 20, then
+  # typechecks, builds and unit-tests it.
+  frontend:
+    runs-on: ci
+    steps:
+      - uses: actions/checkout@v4
+      - uses: actions/setup-node@v4
+        with:
+          node-version: "20"
+      - name: Install (workspaces)
+        # `npm ci` installs exactly what the lockfile pins and fails if the
+        # lockfile and package.json disagree.
+        run: npm ci
+      - name: Typecheck (all workspaces)
+        run: npm run typecheck
+      - name: Build (all workspaces)
+        run: npm run build
+      - name: Unit tests (workspaces w/ vitest — shared, investigator, publisher)
+        # --workspaces runs the script in every workspace; --if-present skips
+        # workspaces that define no `test` script instead of failing.
+        run: npm test --workspaces --if-present
+
+  # Deploy runs in HOST mode from a PERSISTENT dir (NOT the ephemeral runner
+  # workspace): docker-compose.prod.yml bind-mounts ./assets/minio-data and
+  # ./be0, so MinIO data + submitted files must live on a stable host path or
+  # they would be wiped on every deploy.
+  deploy:
+    # Gate: both test jobs must pass, and only pushes to main deploy (never PRs).
+    needs: [backend, frontend]
+    if: github.event_name == 'push' && github.ref == 'refs/heads/main'
+    runs-on: deploy
+    steps:
+      - name: Sync code to persistent deploy dir
+        # First run clones the repo; later runs hard-reset the checkout to
+        # origin/main. NOTE(review): this deploys whatever main points at when
+        # the step runs, which may be newer than the commit this run tested —
+        # confirm that is intended.
+        run: |
+          set -euo pipefail
+          DEPLOY_DIR=/srv/sciagent
+          if [ ! -d "$DEPLOY_DIR/.git" ]; then
+            git clone http://localhost:3000/tlam89/sciagent.git "$DEPLOY_DIR"
+          fi
+          cd "$DEPLOY_DIR"
+          git fetch origin main
+          git reset --hard origin/main
+      - name: Materialize prod .env from secret
+        # The secret reaches the script as an environment variable instead of
+        # being expression-interpolated into the script text. Pasted inside
+        # double quotes, any ", $, backtick or backslash in the secret would be
+        # re-interpreted by the shell (corrupting .env or running commands).
+        # umask 077 makes a newly created .env owner-only from the start; the
+        # chmod still tightens a file left over from an earlier deploy.
+        env:
+          PROD_ENV: ${{ secrets.PROD_ENV }}
+        run: |
+          set -euo pipefail
+          umask 077
+          printf '%s' "$PROD_ENV" > /srv/sciagent/.env
+          chmod 600 /srv/sciagent/.env
+      - name: Deploy stack (build locally, no registry pull)
+        run: cd /srv/sciagent && bash scripts/deploy-prod.sh --no-pull
+      - name: Stack health check
+        run: cd /srv/sciagent && bash scripts/check-prod-stack.sh
@@ -0,0 +1,41 @@
+# Logs
+logs
+*.log
+npm-debug.log*
+yarn-debug.log*
+yarn-error.log*
+pnpm-debug.log*
+lerna-debug.log*
+
+node_modules
+dist
+dist-ssr
+*.local
+
+# Editor directories and files
+.vscode/*
+!.vscode/extensions.json
+.idea
+.DS_Store
+*.suo
+*.ntvs*
+*.njsproj
+*.sln
+*.sw?
+
+# Secrets — commit only `.env.example`, never `.env`.
+.env
+
+.env.local
+.env.*.local
+ 
+# Keep the example/template
+!.env.example
+
+assets/minio-data/*
+
+be0/.venv/
+
+# HMW-mode marker — session-local toggle (/ultra-on … /ultra-off). Never commit;
+# committing it would leave a fresh `git clone` stuck in token-burn mode.
+.claude/hmw-mode.on
@@ -0,0 +1,201 @@
+Apache License
+                           Version 2.0, January 2004
+                        http://www.apache.org/licenses/
+
+   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+
+   1. Definitions.
+
+      "License" shall mean the terms and conditions for use, reproduction,
+      and distribution as defined by Sections 1 through 9 of this document.
+
+      "Licensor" shall mean the copyright owner or entity authorized by
+      the copyright owner that is granting the License.
+
+      "Legal Entity" shall mean the union of the acting entity and all
+      other entities that control, are controlled by, or are under common
+      control with that entity. For the purposes of this definition,
+      "control" means (i) the power, direct or indirect, to cause the
+      direction or management of such entity, whether by contract or
+      otherwise, or (ii) ownership of fifty percent (50%) or more of the
+      outstanding shares, or (iii) beneficial ownership of such entity.
+
+      "You" (or "Your") shall mean an individual or Legal Entity
+      exercising permissions granted by this License.
+
+      "Source" form shall mean the preferred form for making modifications,
+      including but not limited to software source code, documentation
+      source, and configuration files.
+
+      "Object" form shall mean any form resulting from mechanical
+      transformation or translation of a Source form, including but
+      not limited to compiled object code, generated documentation,
+      and conversions to other media types.
+
+      "Work" shall mean the work of authorship, whether in Source or
+      Object form, made available under the License, as indicated by a
+      copyright notice that is included in or attached to the work
+      (an example is provided in the Appendix below).
+
+      "Derivative Works" shall mean any work, whether in Source or Object
+      form, that is based on (or derived from) the Work and for which the
+      editorial revisions, annotations, elaborations, or other modifications
+      represent, as a whole, an original work of authorship. For the purposes
+      of this License, Derivative Works shall not include works that remain
+      separable from, or merely link (or bind by name) to the interfaces of,
+      the Work and Derivative Works thereof.
+
+      "Contribution" shall mean any work of authorship, including
+      the original version of the Work and any modifications or additions
+      to that Work or Derivative Works thereof, that is intentionally
+      submitted to Licensor for inclusion in the Work by the copyright owner
+      or by an individual or Legal Entity authorized to submit on behalf of
+      the copyright owner. For the purposes of this definition, "submitted"
+      means any form of electronic, verbal, or written communication sent
+      to the Licensor or its representatives, including but not limited to
+      communication on electronic mailing lists, source code control systems,
+      and issue tracking systems that are managed by, or on behalf of, the
+      Licensor for the purpose of discussing and improving the Work, but
+      excluding communication that is conspicuously marked or otherwise
+      designated in writing by the copyright owner as "Not a Contribution."
+
+      "Contributor" shall mean Licensor and any individual or Legal Entity
+      on behalf of whom a Contribution has been received by Licensor and
+      subsequently incorporated within the Work.
+
+   2. Grant of Copyright License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      copyright license to reproduce, prepare Derivative Works of,
+      publicly display, publicly perform, sublicense, and distribute the
+      Work and such Derivative Works in Source or Object form.
+
+   3. Grant of Patent License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      (except as stated in this section) patent license to make, have made,
+      use, offer to sell, sell, import, and otherwise transfer the Work,
+      where such license applies only to those patent claims licensable
+      by such Contributor that are necessarily infringed by their
+      Contribution(s) alone or by combination of their Contribution(s)
+      with the Work to which such Contribution(s) was submitted. If You
+      institute patent litigation against any entity (including a
+      cross-claim or counterclaim in a lawsuit) alleging that the Work
+      or a Contribution incorporated within the Work constitutes direct
+      or contributory patent infringement, then any patent licenses
+      granted to You under this License for that Work shall terminate
+      as of the date such litigation is filed.
+
+   4. Redistribution. You may reproduce and distribute copies of the
+      Work or Derivative Works thereof in any medium, with or without
+      modifications, and in Source or Object form, provided that You
+      meet the following conditions:
+
+      (a) You must give any other recipients of the Work or
+          Derivative Works a copy of this License; and
+
+      (b) You must cause any modified files to carry prominent notices
+          stating that You changed the files; and
+
+      (c) You must retain, in the Source form of any Derivative Works
+          that You distribute, all copyright, patent, trademark, and
+          attribution notices from the Source form of the Work,
+          excluding those notices that do not pertain to any part of
+          the Derivative Works; and
+
+      (d) If the Work includes a "NOTICE" text file as part of its
+          distribution, then any Derivative Works that You distribute must
+          include a readable copy of the attribution notices contained
+          within such NOTICE file, excluding those notices that do not
+          pertain to any part of the Derivative Works, in at least one
+          of the following places: within a NOTICE text file distributed
+          as part of the Derivative Works; within the Source form or
+          documentation, if provided along with the Derivative Works; or,
+          within a display generated by the Derivative Works, if and
+          wherever such third-party notices normally appear. The contents
+          of the NOTICE file are for informational purposes only and
+          do not modify the License. You may add Your own attribution
+          notices within Derivative Works that You distribute, alongside
+          or as an addendum to the NOTICE text from the Work, provided
+          that such additional attribution notices cannot be construed
+          as modifying the License.
+
+      You may add Your own copyright statement to Your modifications and
+      may provide additional or different license terms and conditions
+      for use, reproduction, or distribution of Your modifications, or
+      for any such Derivative Works as a whole, provided Your use,
+      reproduction, and distribution of the Work otherwise complies with
+      the conditions stated in this License.
+
+   5. Submission of Contributions. Unless You explicitly state otherwise,
+      any Contribution intentionally submitted for inclusion in the Work
+      by You to the Licensor shall be under the terms and conditions of
+      this License, without any additional terms or conditions.
+      Notwithstanding the above, nothing herein shall supersede or modify
+      the terms of any separate license agreement you may have executed
+      with Licensor regarding such Contributions.
+
+   6. Trademarks. This License does not grant permission to use the trade
+      names, trademarks, service marks, or product names of the Licensor,
+      except as required for reasonable and customary use in describing the
+      origin of the Work and reproducing the content of the NOTICE file.
+
+   7. Disclaimer of Warranty. Unless required by applicable law or
+      agreed to in writing, Licensor provides the Work (and each
+      Contributor provides its Contributions) on an "AS IS" BASIS,
+      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+      implied, including, without limitation, any warranties or conditions
+      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
+      PARTICULAR PURPOSE. You are solely responsible for determining the
+      appropriateness of using or redistributing the Work and assume any
+      risks associated with Your exercise of permissions under this License.
+
+   8. Limitation of Liability. In no event and under no legal theory,
+      whether in tort (including negligence), contract, or otherwise,
+      unless required by applicable law (such as deliberate and grossly
+      negligent acts) or agreed to in writing, shall any Contributor be
+      liable to You for damages, including any direct, indirect, special,
+      incidental, or consequential damages of any character arising as a
+      result of this License or out of the use or inability to use the
+      Work (including but not limited to damages for loss of goodwill,
+      work stoppage, computer failure or malfunction, or any and all
+      other commercial damages or losses), even if such Contributor
+      has been advised of the possibility of such damages.
+
+   9. Accepting Warranty or Additional Liability. While redistributing
+      the Work or Derivative Works thereof, You may choose to offer,
+      and charge a fee for, acceptance of support, warranty, indemnity,
+      or other liability obligations and/or rights consistent with this
+      License. However, in accepting such obligations, You may act only
+      on Your own behalf and on Your sole responsibility, not on behalf
+      of any other Contributor, and only if You agree to indemnify,
+      defend, and hold each Contributor harmless for any liability
+      incurred by, or claims asserted against, such Contributor by reason
+      of your accepting any such warranty or additional liability.
+
+   END OF TERMS AND CONDITIONS
+
+   APPENDIX: How to apply the Apache License to your work.
+
+      To apply the Apache License to your work, attach the following
+      boilerplate notice, with the fields enclosed by brackets "[]"
+      replaced with your own identifying information. (Don't include
+      the brackets!)  The text should be enclosed in the appropriate
+      comment syntax for the file format. We also recommend that a
+      file or class name and description of purpose be included on the
+      same "printed page" as the copyright notice for easier
+      identification within third-party archives.
+
+   Copyright [yyyy] [name of copyright owner]
+
+   Licensed under the Apache License, Version 2.0 (the "License");
+   you may not use this file except in compliance with the License.
+   You may obtain a copy of the License at
+
+       http://www.apache.org/licenses/LICENSE-2.0
+
+   Unless required by applicable law or agreed to in writing, software
+   distributed under the License is distributed on an "AS IS" BASIS,
+   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+   See the License for the specific language governing permissions and
+   limitations under the License.
@@ -0,0 +1,137 @@
+-- =============================================================================
+-- CRUD PATTERNS — Sáng kiến application system
+-- =============================================================================
+
+-- =============================================================================
+-- CREATE: Submit a new application with multiple authors (atomic)
+-- =============================================================================
+BEGIN;
+  -- Set audit context. The third argument (is_local = true) limits the setting
+  -- to the current transaction.
+  SELECT set_config('my.user_id', '42', true);
+
+  -- 1. Main record. The statement is terminated by psql's \gset meta-command
+  --    (not by ';'): psql runs the INSERT and stores the returned column in the
+  --    psql variable :application_id, which the inserts below reuse.
+  INSERT INTO applications(code, title, registration_year, status, purpose,
+                           is_technical_solution, primary_unit_id, created_by)
+  VALUES ('SK-2025-007',
+          'Hệ thống tự động điền hồ sơ sáng kiến',
+          2025, 'DRAFT',
+          'Tự động hoá việc điền các mẫu số 01–04',
+          TRUE, 2, 42)
+  RETURNING application_id \gset
+
+  -- 2. Authors (defer contribution-sum check until COMMIT). The three rows below
+  --    add up to 100.00 only once all of them are present.
+  SET CONSTRAINTS trg_contribution_total DEFERRED;
+  INSERT INTO application_authors(application_id, user_id, contribution_pct, role, display_order) VALUES
+    (:application_id, 42, 60.00, 'PRIMARY',    1),
+    (:application_id, 13, 25.00, 'CO_AUTHOR',  2),
+    (:application_id, 27, 15.00, 'CO_AUTHOR',  3);
+
+  -- 3. Orgs that tested it
+  INSERT INTO application_adopters(application_id, org_name, address, field) VALUES
+    (:application_id, 'Phòng KHCN', '217 Hồng Bàng, Q.5', 'Cải cách hành chính');
+COMMIT;
+
+
+-- =============================================================================
+-- READ: Dashboard — paginated list with filters
+-- =============================================================================
+-- First page (20 rows) of 2025 applications that are under review or evaluated
+-- and whose title contains the search phrase; best average score first,
+-- unscored rows last, newest submission breaking ties.
+SELECT *
+FROM v_application_summary
+WHERE registration_year = 2025
+  AND status = ANY (ARRAY['UNDER_REVIEW', 'EVALUATED']::text[])
+  AND title ILIKE '%động vật%'   -- substring match; can use a pg_trgm index on title if one exists
+ORDER BY avg_score DESC NULLS LAST,
+         submitted_at DESC
+LIMIT 20
+OFFSET 0;
+
+-- Read: full application with nested data (app layer usually does this as N queries
+-- or one JSON aggregate — here's the aggregate version).
+-- jsonb_agg() returns NULL when it aggregates zero rows, so each nested list is
+-- wrapped in COALESCE(..., '[]'::jsonb): consumers always receive a JSON array,
+-- never null, for an application with no authors/evaluations/attachments.
+SELECT jsonb_build_object(
+  'application', to_jsonb(a.*),
+  'authors',     COALESCE((SELECT jsonb_agg(jsonb_build_object(
+                    'user_id', u.user_id,
+                    'name',    u.full_name,
+                    'pct',     aa.contribution_pct,
+                    'role',    aa.role
+                  ) ORDER BY aa.display_order)
+                  FROM application_authors aa
+                  JOIN users u USING (user_id)
+                  WHERE aa.application_id = a.application_id), '[]'::jsonb),
+  'evaluations', COALESCE((SELECT jsonb_agg(to_jsonb(e.*))
+                  FROM evaluations e WHERE e.application_id = a.application_id), '[]'::jsonb),
+  'attachments', COALESCE((SELECT jsonb_agg(to_jsonb(att.*))
+                  FROM attachments att WHERE att.application_id = a.application_id), '[]'::jsonb)
+) AS document
+FROM applications a
+WHERE a.application_id = 1 AND a.deleted_at IS NULL;
+
+-- Full-text search (Vietnamese-friendly; combine with unaccent for better recall).
+-- Matches the phrase against title + introduction using the 'simple' text search
+-- configuration. Soft-deleted rows are excluded, as in the single-application
+-- read.
+SELECT application_id, code, title
+  FROM applications
+ WHERE to_tsvector('simple', title || ' ' || coalesce(introduction,''))
+    @@ plainto_tsquery('simple', 'đạo đức động vật')
+   AND deleted_at IS NULL
+ ORDER BY registration_year DESC
+ LIMIT 10;
+
+
+-- =============================================================================
+-- UPDATE: Progress an application through the workflow
+-- =============================================================================
+-- Step 1 — submit: DRAFT → SUBMITTED. Triggers populate submitted_at automatically.
+UPDATE applications
+   SET status = 'SUBMITTED'
+ WHERE application_id = 7;
+
+-- Step 2 — hand the application to the review panel.
+UPDATE applications
+   SET status = 'UNDER_REVIEW'
+ WHERE application_id = 7;
+
+-- Step 3 — record an evaluation. If this evaluator already scored the
+-- application, the existing row is overwritten with the new scores and
+-- conclusion, and evaluated_at is refreshed.
+INSERT INTO evaluations (
+    application_id,
+    evaluator_id,
+    novelty_score,
+    effectiveness_score,
+    conclusion
+)
+VALUES (7, 99, 32, 48, 'Đề nghị công nhận')
+ON CONFLICT (application_id, evaluator_id) DO UPDATE
+   SET novelty_score       = EXCLUDED.novelty_score,
+       effectiveness_score = EXCLUDED.effectiveness_score,
+       conclusion          = EXCLUDED.conclusion,
+       evaluated_at        = NOW();
+
+-- Update JSONB field: patch a single effectiveness sub-field.
+-- `NULL || jsonb` evaluates to NULL, so a row whose effectiveness is still NULL
+-- is treated as an empty object; without the COALESCE the patch would be
+-- silently discarded for such rows.
+UPDATE applications
+   SET effectiveness = COALESCE(effectiveness, '{}'::jsonb) || jsonb_build_object(
+       'economic',
+       'Tiết kiệm ~30% thời gian xét duyệt'
+   )
+ WHERE application_id = 7;
+
+-- Partial update (PATCH-style) — only update provided fields.
+-- $1 = title, $2 = purpose, $3 = application_id. This static form binds NULL for
+-- an omitted field and lets COALESCE keep the current value, so it cannot be
+-- used to set a column to NULL; an app layer that needs that must instead
+-- generate the SET clause from the fields present in the request body.
+-- Soft-deleted rows are never updated; RETURNING * hands back the updated row.
+UPDATE applications
+   SET title   = COALESCE($1, title),
+       purpose = COALESCE($2, purpose),
+       updated_at = NOW()
+ WHERE application_id = $3 AND deleted_at IS NULL
+RETURNING *;
+
+
+-- =============================================================================
+-- DELETE: Soft delete + restore
+-- =============================================================================
+-- Soft delete. The deleted_at IS NULL guard makes a repeated delete a no-op, so
+-- the original deletion timestamp is preserved.
+UPDATE applications SET deleted_at = NOW()
+ WHERE application_id = 7 AND deleted_at IS NULL;
+
+-- Restore. Only touches a row that is actually soft-deleted.
+UPDATE applications SET deleted_at = NULL
+ WHERE application_id = 7 AND deleted_at IS NOT NULL;
+
+-- Hard delete (only for drafts, cascades to authors/evaluations/etc.)
+DELETE FROM applications
+ WHERE application_id = 7
+   AND status = 'DRAFT';
+
+
+-- =============================================================================
+-- ANALYTICS: Materialized-view refresh (run nightly via cron/pgAgent)
+-- =============================================================================
+-- CONCURRENTLY lets readers keep querying the view while it is rebuilt;
+-- PostgreSQL only allows it when the materialized view has a unique index.
+REFRESH MATERIALIZED VIEW CONCURRENTLY mv_annual_stats;
+
+-- Leaderboard: top-scoring approved innovations.
+-- PostgreSQL sorts NULLs first under DESC, so NULLS LAST keeps approved
+-- applications that have no avg_score from taking the top places (the same
+-- ordering rule the dashboard list uses).
+SELECT code, title, avg_score
+  FROM v_application_summary
+ WHERE status = 'APPROVED'
+ ORDER BY avg_score DESC NULLS LAST
+ LIMIT 10;
@@ -0,0 +1,422 @@
+-- =============================================================================
+-- SÁNG KIẾN (INNOVATION APPLICATION) DATABASE SCHEMA
+-- PostgreSQL 14+
+--
+-- Domain: Manage innovation applications at ĐHYD TP.HCM (Vietnamese medical
+-- university). Supports the full lifecycle: draft → submit → evaluate → approve.
+--
+-- Design principles:
+--   - 3NF for entities, JSONB for semi-structured/optional narrative
+--   - Soft delete (deleted_at) — legal/audit requires historical retention
+--   - State machine on applications.status enforced by trigger
+--   - Full audit_log via trigger on all CUD operations
+--   - Contribution % sums to 100 enforced by DEFERRABLE trigger
+-- =============================================================================
+
+-- pg_trgm supplies the gin_trgm_ops operator class used by the trigram indexes
+-- on users.full_name and applications.title.
+CREATE EXTENSION IF NOT EXISTS pg_trgm;       -- fuzzy matching
+-- NOTE(review): nothing in this schema calls unaccent(); presumably it is used by
+-- application-side search queries — confirm.
+CREATE EXTENSION IF NOT EXISTS unaccent;      -- Vietnamese diacritics in search
+
+-- Trigger helper: stamp the row being written with the current transaction time.
+-- Intended for BEFORE UPDATE ... FOR EACH ROW triggers on tables that have an
+-- updated_at column; returns the (modified) NEW row so the update proceeds.
+CREATE OR REPLACE FUNCTION touch_updated_at() RETURNS TRIGGER AS $$
+BEGIN
+    NEW.updated_at := CURRENT_TIMESTAMP;
+    RETURN NEW;
+END;
+$$ LANGUAGE plpgsql;
+
+
+-- =============================================================================
+-- REFERENCE: UNITS (departments, faculties, centers)
+-- =============================================================================
+-- Organisational units, arranged as a tree through parent_unit_id.
+CREATE TABLE units (
+    unit_id        SERIAL PRIMARY KEY,
+    code           VARCHAR(32) UNIQUE NOT NULL,                   -- short unique code, e.g. 'KHCN'
+    name           VARCHAR(255) NOT NULL,                         -- full Vietnamese name
+    -- Self-reference: deleting a parent detaches its children (SET NULL) rather
+    -- than deleting them.
+    parent_unit_id INT REFERENCES units(unit_id) ON DELETE SET NULL,
+    -- Closed set of unit kinds. NOTE(review): the codes look like unaccented
+    -- Vietnamese (TRUONG = school/university, KHOA = faculty, PHONG = office,
+    -- BO_MON = department, TRUNG_TAM = center, KHAC = other) — confirm.
+    type           VARCHAR(32) NOT NULL
+                   CHECK (type IN ('TRUONG','KHOA','PHONG','BO_MON','TRUNG_TAM','KHAC')),
+    is_active      BOOLEAN NOT NULL DEFAULT TRUE,
+    created_at     TIMESTAMPTZ NOT NULL DEFAULT NOW(),
+    updated_at     TIMESTAMPTZ NOT NULL DEFAULT NOW()
+);
+-- Keep updated_at current on every row update.
+CREATE TRIGGER trg_units_touch BEFORE UPDATE ON units
+    FOR EACH ROW EXECUTE FUNCTION touch_updated_at();
+
+
+-- =============================================================================
+-- USERS (unified: authors, evaluators, admins — a user can wear many hats)
+-- =============================================================================
+-- People known to the system. One row per person; user_type records the main role.
+CREATE TABLE users (
+    user_id        SERIAL PRIMARY KEY,
+    full_name      VARCHAR(255) NOT NULL,
+    title          VARCHAR(64),            -- academic title, e.g. PGS.TS, TS., GS., CN., ThS.
+    date_of_birth  DATE,
+    email          VARCHAR(255) UNIQUE,    -- nullable; UNIQUE still allows several NULLs
+    phone          VARCHAR(32),
+    id_number      VARCHAR(32) UNIQUE,     -- citizen ID card (CCCD) / passport number
+    unit_id        INT REFERENCES units(unit_id) ON DELETE SET NULL,
+    position       VARCHAR(255),           -- job position, e.g. head of office, senior lecturer
+    qualification  VARCHAR(64),            -- education level, e.g. doctorate, master's, bachelor's
+    user_type      VARCHAR(32) NOT NULL DEFAULT 'AUTHOR'
+                   CHECK (user_type IN ('AUTHOR','COUNCIL','ADMIN','STUDENT','EXTERNAL')),
+    is_active      BOOLEAN NOT NULL DEFAULT TRUE,
+    deleted_at     TIMESTAMPTZ,            -- soft delete: NULL means the row is live
+    created_at     TIMESTAMPTZ NOT NULL DEFAULT NOW(),
+    updated_at     TIMESTAMPTZ NOT NULL DEFAULT NOW()
+);
+CREATE INDEX idx_users_unit ON users(unit_id);
+-- Partial index: covers only rows that are not soft-deleted.
+CREATE INDEX idx_users_active ON users(is_active) WHERE deleted_at IS NULL;
+-- Trigram index for fuzzy / substring name search (operator class from pg_trgm).
+CREATE INDEX idx_users_name_trgm ON users USING GIN (full_name gin_trgm_ops);
+-- Keep updated_at current on every row update.
+CREATE TRIGGER trg_users_touch BEFORE UPDATE ON users
+    FOR EACH ROW EXECUTE FUNCTION touch_updated_at();
+
+
+-- =============================================================================
+-- APPLICATIONS (sáng kiến) — the core entity
+-- =============================================================================
+-- One row per innovation application; child tables reference application_id.
+CREATE TABLE applications (
+    application_id        SERIAL PRIMARY KEY,
+    code                  VARCHAR(32) UNIQUE NOT NULL,  -- e.g., 'SK-2025-001'
+    title                 TEXT NOT NULL,
+    title_en              TEXT,
+    registration_year     INT NOT NULL CHECK (registration_year BETWEEN 2000 AND 2100),
+    field_of_application  TEXT,                         -- field in which the innovation is applied
+
+    -- Workflow state (transitions are validated by the BEFORE UPDATE OF status
+    -- trigger defined later in this file; this CHECK only limits the value set)
+    status                VARCHAR(32) NOT NULL DEFAULT 'DRAFT'
+                          CHECK (status IN (
+                            'DRAFT','SUBMITTED','UNDER_REVIEW',
+                            'EVALUATED','APPROVED','REJECTED','WITHDRAWN'
+                          )),
+
+    -- Form 01 ("Mẫu 01") narrative (long text)
+    introduction          TEXT,         -- 1. Introduction
+    current_state         TEXT,         -- 4.1 Known / existing state
+    purpose               TEXT,         -- Purpose
+    implementation_steps  TEXT,         -- Implementation steps
+    required_conditions   TEXT,         -- Required conditions
+    results_achieved      TEXT,         -- Results obtained
+    novelty_description   TEXT,         -- Novelty
+    confidential_info     TEXT,         -- Information that must be kept confidential
+
+    -- 10 effectiveness sub-fields (all optional narrative) → JSONB
+    effectiveness         JSONB NOT NULL DEFAULT '{}'::jsonb,
+    -- Shape: { "economic":"...", "teaching":"...", "productivity":"...",
+    --          "work_efficiency":"...", "quality":"...", "cost_reduction":"...",
+    --          "environment":"...", "health":"...", "safety":"...", "awareness":"..." }
+    -- (the shape is documentation only; no constraint in this table enforces it)
+
+    -- Form 02 ("Mẫu 02") fields
+    owner_org             VARCHAR(255),       -- investing / owning organisation
+    first_applied_date    DATE,               -- date the innovation was first applied
+    content_summary       TEXT,               -- content of the innovation (short)
+    author_assessment     TEXT,               -- assessment according to the author
+    org_assessment        TEXT,               -- assessment according to the organisation
+
+    -- Form 02 classification (mutually exclusive in form, but stored as flags)
+    is_technical_solution     BOOLEAN NOT NULL DEFAULT FALSE,
+    is_from_research_article  BOOLEAN NOT NULL DEFAULT FALSE,
+    is_from_book_material     BOOLEAN NOT NULL DEFAULT FALSE,
+    -- Drafts may leave all flags unset; every other status needs exactly one flag
+    -- set (each boolean is cast to 0/1 and the sum must equal 1).
+    CONSTRAINT chk_exactly_one_classification CHECK (
+        status = 'DRAFT' OR
+        (is_technical_solution::int + is_from_research_article::int + is_from_book_material::int) = 1
+    ),
+
+    -- Workflow timestamps (written by the status-transition trigger)
+    submitted_at          TIMESTAMPTZ,
+    decided_at            TIMESTAMPTZ,
+
+    -- No ON DELETE action on these two keys: a referenced unit or user cannot be
+    -- deleted while an application still points at it.
+    primary_unit_id       INT REFERENCES units(unit_id),
+    created_by            INT REFERENCES users(user_id),
+    deleted_at            TIMESTAMPTZ,        -- soft delete: NULL means the row is live
+    created_at            TIMESTAMPTZ NOT NULL DEFAULT NOW(),
+    updated_at            TIMESTAMPTZ NOT NULL DEFAULT NOW()
+);
+
+-- Partial index: status lookups over live (not soft-deleted) rows only.
+CREATE INDEX idx_apps_status ON applications(status) WHERE deleted_at IS NULL;
+CREATE INDEX idx_apps_year ON applications(registration_year);
+CREATE INDEX idx_apps_unit ON applications(primary_unit_id);
+-- Trigram index for fuzzy / substring title search (operator class from pg_trgm).
+CREATE INDEX idx_apps_title_trgm ON applications USING GIN (title gin_trgm_ops);
+-- Full-text expression index over title + introduction + novelty_description.
+-- Uses the 'simple' configuration (no stemming). A query has to use the same
+-- to_tsvector('simple', ...) expression for this index to be considered.
+CREATE INDEX idx_apps_fts ON applications USING GIN (
+    to_tsvector('simple',
+        coalesce(title,'') || ' ' ||
+        coalesce(introduction,'') || ' ' ||
+        coalesce(novelty_description,'')
+    )
+);
+-- GIN index over the effectiveness JSONB document (default jsonb operator class).
+CREATE INDEX idx_apps_effectiveness ON applications USING GIN (effectiveness);
+-- Keep updated_at current on every row update.
+CREATE TRIGGER trg_apps_touch BEFORE UPDATE ON applications
+    FOR EACH ROW EXECUTE FUNCTION touch_updated_at();
+
+
+-- =============================================================================
+-- APPLICATION_AUTHORS (M:N with contribution %)
+-- =============================================================================
+-- Link table between applications and users carrying each author's share.
+CREATE TABLE application_authors (
+    application_id   INT NOT NULL REFERENCES applications(application_id) ON DELETE CASCADE,
+    -- No ON DELETE action: a user who is an author cannot be hard-deleted.
+    user_id          INT NOT NULL REFERENCES users(user_id),
+    -- Per-author share in percent, range (0, 100] with two decimals. The per-
+    -- application total is checked separately by a deferred constraint trigger.
+    contribution_pct NUMERIC(5,2) NOT NULL CHECK (contribution_pct > 0 AND contribution_pct <= 100),
+    role             VARCHAR(32) NOT NULL DEFAULT 'CO_AUTHOR'
+                     CHECK (role IN ('PRIMARY','CO_AUTHOR')),
+    display_order    INT NOT NULL DEFAULT 0,   -- sort key when listing author names
+    PRIMARY KEY (application_id, user_id)      -- a user appears at most once per application
+);
+CREATE INDEX idx_app_authors_user ON application_authors(user_id);
+
+-- At most one PRIMARY author per application
+-- (partial unique index: only rows with role = 'PRIMARY' take part, so zero
+-- PRIMARY authors is still allowed)
+CREATE UNIQUE INDEX uq_primary_per_app
+    ON application_authors(application_id) WHERE role = 'PRIMARY';
+
+-- Deferrable check: contribution % must total 100 per application
+--
+-- Fired once per inserted / updated / deleted application_authors row. Because
+-- the constraint trigger below is INITIALLY DEFERRED the check runs at COMMIT,
+-- so a transaction may pass through intermediate states whose total is not 100.
+--
+-- Skipped for an application that is still in DRAFT and for an application whose
+-- row no longer exists (author rows removed by ON DELETE CASCADE).
+-- An UPDATE that moves an author row to a different application_id validates
+-- BOTH the application the row left and the one it joined.
+--
+-- Raises an exception when a checked application's total differs from 100.
+-- The return value of an AFTER trigger is ignored, hence RETURN NULL.
+CREATE OR REPLACE FUNCTION check_contribution_total() RETURNS TRIGGER AS $$
+DECLARE
+    v_apps   INT[];      -- application ids affected by this row change
+    v_app    INT;
+    v_status TEXT;
+    v_total  NUMERIC;
+BEGIN
+    IF TG_OP = 'INSERT' THEN
+        v_apps := ARRAY[NEW.application_id];
+    ELSIF TG_OP = 'DELETE' THEN
+        v_apps := ARRAY[OLD.application_id];
+    ELSIF NEW.application_id IS DISTINCT FROM OLD.application_id THEN
+        -- The row changed owner: the old application lost a share as well.
+        v_apps := ARRAY[NEW.application_id, OLD.application_id];
+    ELSE
+        v_apps := ARRAY[NEW.application_id];
+    END IF;
+
+    FOREACH v_app IN ARRAY v_apps LOOP
+        -- No matching row leaves v_status NULL (application already deleted).
+        SELECT status INTO v_status
+          FROM applications
+         WHERE application_id = v_app;
+
+        -- Only enforce when application has left DRAFT
+        CONTINUE WHEN v_status IS NULL OR v_status = 'DRAFT';
+
+        SELECT COALESCE(SUM(contribution_pct), 0) INTO v_total
+          FROM application_authors
+         WHERE application_id = v_app;
+
+        IF v_total <> 100 THEN
+            -- %% emits a literal percent sign; each single % consumes one argument.
+            RAISE EXCEPTION 'Contribution %% for application % must sum to 100 (got %)',
+                v_app, v_total;
+        END IF;
+    END LOOP;
+
+    RETURN NULL;
+END;
+$$ LANGUAGE plpgsql;
+
+CREATE CONSTRAINT TRIGGER trg_contribution_total
+    AFTER INSERT OR UPDATE OR DELETE ON application_authors
+    DEFERRABLE INITIALLY DEFERRED
+    FOR EACH ROW EXECUTE FUNCTION check_contribution_total();
+
+
+-- =============================================================================
+-- ORGS that tested / adopted the innovation (Mẫu 01 inner table)
+-- =============================================================================
+-- Organisations listed on an application as having tested / adopted it.
+-- Rows are free text and disappear together with their application (CASCADE).
+CREATE TABLE application_adopters (
+    adopter_id      SERIAL PRIMARY KEY,
+    application_id  INT NOT NULL REFERENCES applications(application_id) ON DELETE CASCADE,
+    display_order   INT NOT NULL DEFAULT 0,   -- position of the row within the form table
+    org_name        VARCHAR(255) NOT NULL,
+    address         TEXT,
+    field           TEXT                      -- NOTE(review): presumably the field of adoption — confirm
+);
+CREATE INDEX idx_adopters_app ON application_adopters(application_id);
+
+
+-- =============================================================================
+-- PARTICIPANTS in first application (Mẫu 02 inner table)
+-- =============================================================================
+-- People who took part in the first application of the innovation.
+-- Personal details are stored on the row itself, so a participant does not have
+-- to exist in users; user_id is only an optional link.
+CREATE TABLE application_participants (
+    participant_id  SERIAL PRIMARY KEY,
+    application_id  INT NOT NULL REFERENCES applications(application_id) ON DELETE CASCADE,
+    user_id         INT REFERENCES users(user_id),        -- optional link
+    display_order   INT NOT NULL DEFAULT 0,               -- position of the row within the form table
+    full_name       VARCHAR(255) NOT NULL,
+    date_of_birth   DATE,
+    work_unit       VARCHAR(255),                         -- free text, not a units FK
+    position        VARCHAR(255),
+    qualification   VARCHAR(64),
+    support_content TEXT
+);
+CREATE INDEX idx_participants_app ON application_participants(application_id);
+
+
+-- =============================================================================
+-- EVALUATIONS (Mẫu 04) — council members score applications
+-- =============================================================================
+-- One score sheet per (application, evaluator) pair.
+CREATE TABLE evaluations (
+    evaluation_id         SERIAL PRIMARY KEY,
+    application_id        INT NOT NULL REFERENCES applications(application_id) ON DELETE CASCADE,
+    -- No ON DELETE action: a user who has evaluated cannot be hard-deleted.
+    evaluator_id          INT NOT NULL REFERENCES users(user_id),
+
+    novelty_comments      TEXT,
+    novelty_score         INT NOT NULL DEFAULT 0
+                          CHECK (novelty_score BETWEEN 0 AND 40),        -- 0..40 points
+
+    effectiveness_comments TEXT,
+    effectiveness_score   INT NOT NULL DEFAULT 0
+                          CHECK (effectiveness_score BETWEEN 0 AND 60),  -- 0..60 points
+
+    -- Derived and stored by the database (maximum 40 + 60 = 100); cannot be
+    -- written directly.
+    total_score           INT GENERATED ALWAYS AS (novelty_score + effectiveness_score) STORED,
+    conclusion            TEXT,
+    evaluated_at          TIMESTAMPTZ NOT NULL DEFAULT NOW(),
+
+    -- Also serves as the ON CONFLICT target for re-scoring upserts.
+    UNIQUE (application_id, evaluator_id)
+);
+CREATE INDEX idx_eval_app ON evaluations(application_id);
+CREATE INDEX idx_eval_evaluator ON evaluations(evaluator_id);
+
+
+-- =============================================================================
+-- COMMITMENTS (Bản cam kết) — for paper-based innovations
+-- =============================================================================
+-- Signed commitment statement: at most one per (application, user).
+CREATE TABLE commitments (
+    commitment_id             SERIAL PRIMARY KEY,
+    application_id            INT NOT NULL REFERENCES applications(application_id) ON DELETE CASCADE,
+    user_id                   INT NOT NULL REFERENCES users(user_id),
+
+    paper_title               TEXT,
+    -- Note: this vocabulary ('PRIMARY_AUTHOR') differs from
+    -- application_authors.role ('PRIMARY'); the two are not interchangeable.
+    role_type                 VARCHAR(32) NOT NULL
+                              CHECK (role_type IN ('PRIMARY_AUTHOR','CO_AUTHOR')),
+
+    -- 5 commitment checkboxes (all default to unchecked; nothing in this table
+    -- requires them to be TRUE)
+    is_legal_owner            BOOLEAN NOT NULL DEFAULT FALSE,
+    is_authorized_by_owner    BOOLEAN NOT NULL DEFAULT FALSE,
+    has_coauthor_consent      BOOLEAN NOT NULL DEFAULT FALSE,
+    not_predatory_journal     BOOLEAN NOT NULL DEFAULT FALSE,
+    complies_with_ip_law      BOOLEAN NOT NULL DEFAULT FALSE,
+
+    signed_at                 TIMESTAMPTZ NOT NULL DEFAULT NOW(),
+
+    UNIQUE (application_id, user_id)
+);
+CREATE INDEX idx_commit_app ON commitments(application_id);
+
+
+-- =============================================================================
+-- ATTACHMENTS (uploaded files — figures, flowcharts, annexes)
+-- =============================================================================
+-- Metadata for files uploaded to an application. Only the object-store key is
+-- kept here (file_path); no file content is stored in this table.
+CREATE TABLE attachments (
+    attachment_id   SERIAL PRIMARY KEY,
+    application_id  INT NOT NULL REFERENCES applications(application_id) ON DELETE CASCADE,
+    file_name       VARCHAR(255) NOT NULL,
+    file_path       TEXT NOT NULL,                 -- S3/MinIO key
+    file_size       BIGINT,                        -- NOTE(review): presumably bytes — confirm
+    mime_type       VARCHAR(128),
+    -- Optional category. NOTE(review): codes look like unaccented Vietnamese
+    -- (LUU_DO = flowchart, PHU_LUC = annex, KY_SO = digital signature,
+    -- KHAC = other) — confirm.
+    kind            VARCHAR(32)                    -- 'LUU_DO', 'PHU_LUC', 'KY_SO', 'KHAC'
+                    CHECK (kind IS NULL OR kind IN ('LUU_DO','PHU_LUC','KY_SO','KHAC')),
+    uploaded_by     INT REFERENCES users(user_id),
+    uploaded_at     TIMESTAMPTZ NOT NULL DEFAULT NOW()
+);
+CREATE INDEX idx_attach_app ON attachments(application_id);
+
+
+-- =============================================================================
+-- AUDIT LOG — single table, populated by triggers on all CUD operations
+-- =============================================================================
+-- Append-only change history shared by every audited table.
+CREATE TABLE audit_log (
+    log_id       BIGSERIAL PRIMARY KEY,
+    table_name   VARCHAR(64) NOT NULL,  -- TG_TABLE_NAME of the audited table
+    record_id    TEXT NOT NULL,         -- key value of the changed row, stored as text
+    action       VARCHAR(16) NOT NULL CHECK (action IN ('INSERT','UPDATE','DELETE')),
+    -- Deliberately not a foreign key to users; NULL when the app did not identify
+    -- the acting user.
+    changed_by   INT,                   -- set from app via SET LOCAL my.user_id
+    changed_at   TIMESTAMPTZ NOT NULL DEFAULT NOW(),
+    old_data     JSONB,                 -- full row before the change (UPDATE / DELETE)
+    new_data     JSONB                  -- full row after the change (INSERT / UPDATE)
+);
+-- History of a single record.
+CREATE INDEX idx_audit_table_record ON audit_log(table_name, record_id);
+-- Most recent activity of a single user.
+CREATE INDEX idx_audit_user_time ON audit_log(changed_by, changed_at DESC);
+
+-- Generic audit trigger function
+--
+-- Writes one audit_log row for every inserted, updated or deleted row of the
+-- table it is attached to (AFTER ... FOR EACH ROW).
+--
+-- Trigger argument:
+--   TG_ARGV[0]  name of the column whose value is stored in audit_log.record_id
+--
+-- Acting user: read from the custom setting my.user_id, which the application is
+-- expected to set per transaction (SET LOCAL my.user_id = '42'). changed_by is
+-- NULL when the setting is absent, empty or not a valid integer.
+CREATE OR REPLACE FUNCTION audit_trigger() RETURNS TRIGGER AS $$
+DECLARE
+    v_setting TEXT;
+    v_user    INT;     -- stays NULL unless a valid user id is found
+    v_pk      TEXT;
+BEGIN
+    -- missing_ok = true yields NULL instead of an error when the setting was
+    -- never defined; a setting whose SET LOCAL scope has ended reads as ''.
+    v_setting := NULLIF(current_setting('my.user_id', true), '');
+
+    -- Enter the (subtransaction-creating) exception block only when there is a
+    -- value to convert, and catch only the conversion failures instead of
+    -- swallowing every possible error.
+    IF v_setting IS NOT NULL THEN
+        BEGIN
+            v_user := v_setting::INT;
+        EXCEPTION
+            WHEN invalid_text_representation OR numeric_value_out_of_range THEN
+                v_user := NULL;
+        END;
+    END IF;
+
+    -- NEW is null for DELETE and OLD is null for INSERT, so take whichever row
+    -- image carries the key column.
+    v_pk := COALESCE(
+        to_jsonb(NEW) ->> TG_ARGV[0],
+        to_jsonb(OLD) ->> TG_ARGV[0]
+    );
+
+    INSERT INTO audit_log(table_name, record_id, action, changed_by, old_data, new_data)
+    VALUES (
+        TG_TABLE_NAME,
+        v_pk,
+        TG_OP,
+        v_user,
+        CASE WHEN TG_OP IN ('UPDATE','DELETE') THEN to_jsonb(OLD) END,
+        CASE WHEN TG_OP IN ('INSERT','UPDATE') THEN to_jsonb(NEW) END
+    );
+
+    -- The return value of an AFTER row trigger is ignored.
+    RETURN COALESCE(NEW, OLD);
+END;
+$$ LANGUAGE plpgsql;
+
+-- Attach audit trigger to the important tables (pass PK column name as arg)
+-- Only the four tables below are audited; units, users, application_adopters,
+-- application_participants and attachments get no audit rows from this file.
+CREATE TRIGGER trg_audit_applications AFTER INSERT OR UPDATE OR DELETE ON applications
+    FOR EACH ROW EXECUTE FUNCTION audit_trigger('application_id');
+-- application_authors has a composite key (application_id, user_id); only
+-- application_id is recorded, so all author rows of one application share the
+-- same record_id (the user is still visible in old_data / new_data).
+CREATE TRIGGER trg_audit_authors AFTER INSERT OR UPDATE OR DELETE ON application_authors
+    FOR EACH ROW EXECUTE FUNCTION audit_trigger('application_id');
+CREATE TRIGGER trg_audit_evaluations AFTER INSERT OR UPDATE OR DELETE ON evaluations
+    FOR EACH ROW EXECUTE FUNCTION audit_trigger('evaluation_id');
+CREATE TRIGGER trg_audit_commitments AFTER INSERT OR UPDATE OR DELETE ON commitments
+    FOR EACH ROW EXECUTE FUNCTION audit_trigger('commitment_id');
+
+
+-- =============================================================================
+-- WORKFLOW STATE MACHINE ENFORCEMENT
+-- =============================================================================
+-- Row-level guard for the applications.status workflow.
+--
+-- Legal moves:
+--   DRAFT        → SUBMITTED | WITHDRAWN
+--   SUBMITTED    → UNDER_REVIEW | WITHDRAWN | DRAFT
+--   UNDER_REVIEW → EVALUATED | WITHDRAWN
+--   EVALUATED    → APPROVED | REJECTED
+-- Every other change of status raises an exception. An UPDATE that leaves the
+-- status value as it was passes through untouched.
+-- Side effects on the row: submitted_at is stamped on DRAFT → SUBMITTED and
+-- decided_at on entering APPROVED or REJECTED.
+CREATE OR REPLACE FUNCTION enforce_application_transitions() RETURNS TRIGGER AS $$
+DECLARE
+    is_legal BOOLEAN;
+BEGIN
+    -- Same status before and after: nothing to validate, nothing to stamp.
+    IF NEW.status = OLD.status THEN
+        RETURN NEW;
+    END IF;
+
+    -- Transition table as (from, to) pairs. COALESCE maps an unknown comparison
+    -- result (NULL status) to "not allowed".
+    is_legal := COALESCE(
+        (OLD.status, NEW.status) IN (
+            ('DRAFT',        'SUBMITTED'),
+            ('DRAFT',        'WITHDRAWN'),
+            ('SUBMITTED',    'UNDER_REVIEW'),
+            ('SUBMITTED',    'WITHDRAWN'),
+            ('SUBMITTED',    'DRAFT'),
+            ('UNDER_REVIEW', 'EVALUATED'),
+            ('UNDER_REVIEW', 'WITHDRAWN'),
+            ('EVALUATED',    'APPROVED'),
+            ('EVALUATED',    'REJECTED')
+        ),
+        FALSE
+    );
+
+    IF is_legal IS NOT TRUE THEN
+        RAISE EXCEPTION 'Invalid status transition: % → %', OLD.status, NEW.status;
+    END IF;
+
+    -- Workflow timestamps are maintained here rather than by the caller.
+    IF OLD.status = 'DRAFT' AND NEW.status = 'SUBMITTED' THEN
+        NEW.submitted_at := NOW();
+    END IF;
+
+    IF NEW.status = 'APPROVED' OR NEW.status = 'REJECTED' THEN
+        NEW.decided_at := NOW();
+    END IF;
+
+    RETURN NEW;
+END;
+$$ LANGUAGE plpgsql;
+
+-- Fires only for UPDATE statements that list status in their SET clause.
+CREATE TRIGGER trg_app_state_machine
+    BEFORE UPDATE OF status ON applications
+    FOR EACH ROW EXECUTE FUNCTION enforce_application_transitions();
+
+
+-- =============================================================================
+-- CONVENIENCE VIEWS
+-- =============================================================================
+
+-- Dashboard view: one row per live (not soft-deleted) application with its unit
+-- name, a comma-separated author list and its evaluation aggregates.
+--   author_names     NULL when the application has no authors
+--   avg_score        NULL when the application has no evaluations
+--   num_evaluations  0 when the application has no evaluations
+CREATE VIEW v_application_summary AS
+SELECT
+    app.application_id,
+    app.code,
+    app.title,
+    app.status,
+    app.registration_year,
+    pu.name AS primary_unit_name,
+    authors.author_names,
+    scores.avg_score,
+    scores.num_evaluations,
+    app.submitted_at,
+    app.decided_at
+FROM applications AS app
+LEFT JOIN units AS pu
+       ON pu.unit_id = app.primary_unit_id
+-- Each lateral subquery is an aggregate without GROUP BY, so it always yields
+-- exactly one row and the CROSS JOIN never drops an application.
+CROSS JOIN LATERAL (
+    SELECT string_agg(usr.full_name, ', ' ORDER BY aa.display_order) AS author_names
+      FROM application_authors AS aa
+      JOIN users AS usr ON usr.user_id = aa.user_id
+     WHERE aa.application_id = app.application_id
+) AS authors
+CROSS JOIN LATERAL (
+    SELECT ROUND(AVG(ev.total_score), 2) AS avg_score,
+           COUNT(*)                      AS num_evaluations
+      FROM evaluations AS ev
+     WHERE ev.application_id = app.application_id
+) AS scores
+WHERE app.deleted_at IS NULL;
+
+-- Materialized view: annual approval statistics (refresh nightly)
+-- One row per registration_year over live (not soft-deleted) applications.
+-- "pending" counts every status other than APPROVED / REJECTED, which includes
+-- DRAFT and WITHDRAWN. approved + rejected + pending = total.
+CREATE MATERIALIZED VIEW mv_annual_stats AS
+SELECT
+    registration_year,
+    COUNT(*) FILTER (WHERE status = 'APPROVED') AS approved,
+    COUNT(*) FILTER (WHERE status = 'REJECTED') AS rejected,
+    COUNT(*) FILTER (WHERE status NOT IN ('APPROVED','REJECTED')) AS pending,
+    COUNT(*) AS total
+FROM applications
+WHERE deleted_at IS NULL
+GROUP BY registration_year;
+-- A unique index is what allows REFRESH MATERIALIZED VIEW CONCURRENTLY.
+CREATE UNIQUE INDEX ON mv_annual_stats(registration_year);
@@ -0,0 +1,83 @@
+-- Validation tests: run in a single transaction per block
+-- ===========================================================
+
+-- 1. SEED: units + users
+-- The script hard-codes generated ids further down (unit_id 1-2, user_id 1-3,
+-- application_id 1), so it assumes a freshly created schema whose SERIAL
+-- sequences start at 1.
+INSERT INTO units(code, name, type) VALUES
+  ('DHYD', 'Đại học Y Dược TP.HCM', 'TRUONG'),
+  ('KHCN', 'Phòng Khoa học Công nghệ', 'PHONG');
+
+-- Two authors and one council member (the evaluator used in step 6).
+INSERT INTO users(full_name, title, email, id_number, unit_id, qualification, user_type) VALUES
+  ('Trần Hùng',         'PGS.TS', 'tranhung@ump.edu.vn',    '001001', 1, 'Tiến sĩ', 'AUTHOR'),
+  ('Đỗ Quốc Vũ',        'CN.',    'doquocvu@ump.edu.vn',    '001002', 2, 'Cử nhân', 'AUTHOR'),
+  ('Nguyễn Hội đồng A', 'PGS.TS', 'hdA@ump.edu.vn',         '002001', 1, 'Tiến sĩ', 'COUNCIL');
+
+-- 2. CREATE an application in DRAFT state
+-- No classification flag is set, which the CHECK constraint permits only while
+-- the status is DRAFT. The trailing "2, 2" is primary_unit_id, created_by.
+INSERT INTO applications(code, title, registration_year, status, purpose, primary_unit_id, created_by)
+VALUES ('SK-2025-001',
+        'Quy trình xét duyệt Đạo đức trong nghiên cứu trên động vật',
+        2025, 'DRAFT',
+        'Chuẩn hoá quy trình xét duyệt hồ sơ',
+        2, 2);
+
+-- 3. ADD authors with DEFERRED constraint (sums to 100 at COMMIT)
+-- The contribution-total trigger is INITIALLY DEFERRED, so it runs at COMMIT
+-- rather than after each inserted row.
+BEGIN;
+INSERT INTO application_authors(application_id, user_id, contribution_pct, role) VALUES
+  (1, 1, 50, 'CO_AUTHOR'),
+  (1, 2, 50, 'PRIMARY');
+-- At this point sum=100, but app is DRAFT so constraint doesn't even care yet
+COMMIT;
+
+-- Verify (expected count: 2)
+SELECT 'Authors inserted:' AS step, count(*) FROM application_authors;
+
+-- 4. TRY to submit the application (DRAFT → SUBMITTED): needs classification
+--    This should FAIL the check constraint because no classification flag is set
+--    (the transition itself is legal; chk_exactly_one_classification is what
+--    rejects the row)
+\echo 'Test 4: should FAIL (missing classification)'
+UPDATE applications SET status='SUBMITTED' WHERE application_id=1;
+\echo ''
+
+-- Fix and retry
+-- Setting exactly one classification flag in the same statement satisfies the
+-- CHECK; the state-machine trigger stamps submitted_at.
+UPDATE applications
+   SET is_technical_solution = TRUE,
+       status = 'SUBMITTED'
+ WHERE application_id = 1;
+SELECT 'After submit:' AS step, status, submitted_at FROM applications WHERE application_id=1;
+
+-- 5. TRY invalid transition SUBMITTED → APPROVED (should FAIL)
+--    Expected error comes from enforce_application_transitions().
+\echo 'Test 5: should FAIL (illegal transition)'
+UPDATE applications SET status='APPROVED' WHERE application_id=1;
+\echo ''
+
+-- Valid transitions
+UPDATE applications SET status='UNDER_REVIEW' WHERE application_id=1;
+
+-- 6. EVALUATOR scores the application
+-- evaluator_id 3 is the COUNCIL user seeded in step 1. total_score is generated
+-- by the database: 35 + 50 = 85.
+INSERT INTO evaluations(application_id, evaluator_id, novelty_score, effectiveness_score, conclusion)
+VALUES (1, 3, 35, 50, 'Đề xuất công nhận');
+
+SELECT 'Evaluation:' AS step, novelty_score, effectiveness_score, total_score FROM evaluations;
+
+-- 7. Move to EVALUATED → APPROVED
+-- Two separate updates are required: UNDER_REVIEW → APPROVED is not a legal
+-- single step. Entering APPROVED stamps decided_at.
+UPDATE applications SET status='EVALUATED' WHERE application_id=1;
+UPDATE applications SET status='APPROVED' WHERE application_id=1;
+
+SELECT 'Final status:' AS step, status, decided_at IS NOT NULL AS has_decision_time
+  FROM applications WHERE application_id=1;
+
+-- 8. READ: summary view
+-- Expected: a single row with both author names, avg_score 85.00 and
+-- num_evaluations 1.
+SELECT code, title, status, author_names, avg_score, num_evaluations
+  FROM v_application_summary;
+
+-- 9. AUDIT trail: who changed what?
+-- Only successful statements appear (failed updates from tests 4 and 5 were
+-- rolled back). new_data is the full row image, so status is read from it.
+SELECT table_name, action, changed_at,
+       (new_data->>'status') AS new_status
+  FROM audit_log
+ WHERE table_name = 'applications'
+ ORDER BY log_id;
+
+-- 10. Bad contribution sum should fail at COMMIT
+-- The UPDATE itself succeeds because the check is deferred; the error is raised
+-- by COMMIT, which rolls the transaction back and leaves the 50/50 split intact.
+\echo 'Test 10: should FAIL (sum != 100 on submitted app)'
+BEGIN;
+  UPDATE application_authors SET contribution_pct = 30 WHERE application_id=1 AND user_id=1;
+  -- sum is now 30+50=80, but app is APPROVED so trigger will reject at commit
+COMMIT;
@@ -0,0 +1,254 @@
+Initiative Management System
+
+The platform consists of two main services plus an AI integration layer:
+
+- **Frontend**: React-based web application with TypeScript and Vite
+- **Backend**: FastAPI-based REST API with Python 3.11
+- **AI Integration**: Ollama-powered document analysis and compliance checking
+
+## Project Structure
+
+```
+poc/
+├── fe0/                    # Frontend service
+│   ├── src/               # React application source
+│   ├── public/            # Static assets
+│   ├── package.json       # Node.js dependencies
+│   └── Dockerfile         # Frontend container
+├── be0/                   # Backend service
+│   ├── src/               # Python application source
+│   ├── main.py           # FastAPI application entry point
+│   ├── requirements.txt  # Python dependencies
+│   └── Dockerfile        # Backend container
+├── assets/               # Shared resources and data
+└── docker-compose.yml    # Service orchestration
+```
+
+## Prerequisites
+
+- Docker 20.10+
+- Docker Compose 2.0+
+- Git
+
+## Quick Start
+
+1. **Clone and setup**
+   ```bash
+   git clone <repository-url>
+   cd poc
+   ```
+
+2. **Start all services**
+   ```bash
+   docker-compose up --build
+   ```
+
+3. **Access the application**
+   - **Frontend**: http://localhost:8081
+   - **Backend API**: http://localhost:4402
+   - **API Documentation**: http://localhost:4402/docs
+
+## Development Setup
+
+### Frontend Development
+
+```bash
+cd fe0
+npm install
+npm run dev
+```
+
+**Available Scripts:**
+- `npm run dev` - Start development server
+- `npm run build` - Build for production
+- `npm run preview` - Preview production build
+- `npm run lint` - Run ESLint
+
+**Technology Stack:**
+- React 18 with TypeScript
+- Vite for build tooling
+- Tailwind CSS for styling
+- shadcn/ui component library
+- React Router for navigation
+- TanStack Query for state management
+
+### Backend Development
+
+```bash
+cd be0
+pip install -r requirements.txt
+uvicorn main:app --host 0.0.0.0 --port 4402 --reload
+```
+
+**Technology Stack:**
+- FastAPI framework
+- Python 3.11
+- Pydantic for data validation
+- LangChain for AI workflows
+- Ollama for local AI models
+- PDF processing with PyPDF and Docling
+
+## API Documentation
+
+### Core Endpoints
+
+#### Workflow Management
+- `POST /workflows` - Initialize new compliance workflow
+- `GET /workflows/{workflow_id}` - Retrieve workflow status
+- `PUT /workflows/{workflow_id}/items` - Update workflow items
+- `POST /workflows/{workflow_id}/approvals` - Submit approvals
+- `GET /workflows/{workflow_id}/report` - Generate status reports
+- `POST /workflows/{workflow_id}/advance` - Progress to next phase
+
+#### Document Processing
+- `POST /upload_document` - Upload and parse documents
+- `POST /get_page` - Retrieve specific document pages
+- `POST /test_ollama` - Test AI model connectivity
+
+#### System Health
+- `GET /health` - Service health check
+- `GET /` - API information and available endpoints
+
+### Request/Response Examples
+
+**Create Workflow:**
+```json
+POST /workflows
+{
+  "project_name": "ISO 27001 Implementation",
+  "project_description": "Implement ISO 27001 controls",
+  "records_officer_email": "officer@company.com"
+}
+```
+
+**Update Workflow Item:**
+```json
+PUT /workflows/{workflow_id}/items
+{
+  "item_id": 1,
+  "status": "completed",
+  "comment": "Implementation completed",
+  "updated_by": "john.doe@company.com"
+}
+```
+
+## Configuration
+
+### Environment Variables
+
+| Variable | Description | Default |
+|----------|-------------|---------|
+| `GENERIC_TIMEZONE` | Application timezone | `UTC` |
+| `NVIDIA_VISIBLE_DEVICES` | GPU access for AI models | `all` |
+| `NVIDIA_DRIVER_CAPABILITIES` | GPU capabilities | `compute,utility` |
+
+### Docker Network Configuration
+
+Services communicate via a custom Docker network (`profyt-net`) with static IP addressing:
+- Frontend: `192.168.42.20`
+- Backend: `192.168.42.22`
+
+## Features
+
+### Compliance Management
+- **ISO 27001** compliance tracking and reporting
+- **Records Management** integration workflows
+- **Risk Assessment** tools and dashboards
+- **Document Processing** with AI-powered analysis
+
+### Workflow Engine
+- Multi-phase compliance workflows
+- Approval management system
+- Progress tracking and reporting
+- Integration with external systems
+
+### AI-Powered Analysis
+- Document parsing and content extraction
+- Compliance gap analysis
+- Automated report generation
+- Natural language processing for policy analysis
+
+## Deployment
+
+### Production Deployment
+
+On the **application host** (SSH), from the repository root:
+
+1. **Secrets & config**
+   ```bash
+   cp .env.example .env
+   # Edit .env: PUBLIC_HOST, ports, MinIO and Postgres credentials (openssl rand -base64 32).
+   # Never commit `.env`. Postgres user/password apply only on FIRST empty DB volume — see `.env.example`.
+   ./scripts/verify-prod-env.sh
+   ```
+
+2. **Deploy (pull, build, recreate containers)**
+   ```bash
+   ./scripts/deploy-prod.sh
+   # Air-gapped / no registry pull:
+   # ./scripts/deploy-prod.sh --no-pull
+   ```
+
+   Or manually (pass `--env-file` explicitly if the env file is not named `.env` next to the compose file):
+   ```bash
+   docker compose --env-file .env -f docker-compose.prod.yml pull
+   docker compose --env-file .env -f docker-compose.prod.yml up -d --build --remove-orphans
+   ```
+
+3. **Smoke checks** (`FE_PORT` and API port come from `.env` / compose; API is `127.0.0.1:4402` in prod compose)
+   ```bash
+   # Replace 8081 with the FE_PORT value in .env when different.
+   curl -sf http://127.0.0.1:8081/
+   curl -sf http://127.0.0.1:4402/health
+   ```
+
+### Scaling Considerations
+
+- **Frontend**: Stateless, horizontally scalable
+- **Backend**: Consider database persistence for production
+- **AI Models**: GPU requirements for optimal performance
+- **Storage**: Implement proper file storage for documents
+
+## Monitoring and Logging
+
+### Application Logs
+- Frontend logs: Available via Docker logs
+- Backend logs: Stored in `be0/logs/` directory
+- System logs: `docker-compose logs [service-name]`
+
+### Health Monitoring
+- Health check endpoints available
+- Docker health checks configured
+- Log aggregation recommended for production
+
+## Security Considerations
+
+### Current Implementation
+- CORS enabled for cross-origin requests
+- Input validation via Pydantic models
+- File upload restrictions
+
+### Production Recommendations
+- Implement authentication/authorization
+- Add rate limiting
+- Enable HTTPS/TLS
+- Implement proper secret management
+- Add audit logging
+
+## Contributing
+
+1. Fork the repository
+2. Create a feature branch (`git checkout -b feature/amazing-feature`)
+3. Commit your changes (`git commit -m 'Add amazing feature'`)
+4. Push to the branch (`git push origin feature/amazing-feature`)
+5. Open a Pull Request
+
+### Development Guidelines
+- Follow TypeScript best practices
+- Write comprehensive tests
+- Update documentation for new features
+- Follow conventional commit messages
+
+## License
+
+This project is licensed under the terms specified in the LICENSE file.
@@ -0,0 +1,29 @@
+# Copy to .env and adjust. docker-compose sets these for the be0 service when using the repo stack.
+INITIATIVE_DATABASE_URL=postgresql+asyncpg://initiative:initiative_secret@localhost:15432/initiatives
+
+# S3 / MinIO — server-to-server (API → object store)
+S3_ENDPOINT_URL=http://localhost:19000
+S3_ACCESS_KEY=minio_user
+S3_SECRET_KEY=minio_password
+S3_BUCKET_ATTACHMENTS=initiative-attachments
+S3_BUCKET_EXPORTS=initiative-exports
+S3_BUCKET_QUARANTINE=initiative-quarantine
+
+# Optional: HTTPS base for presigned URLs (must match public MinIO TLS host; see docs/minio-behind-https.md)
+# S3_PUBLIC_ENDPOINT_URL=https://minio-api.example.com
+
+# Optional: comma-separated extra browser origins for CORS (merged with localhost defaults in main.py).
+# In Docker dev stack, docker-compose.yml can set this; production compose adds your public UI URL automatically.
+# CORS_ORIGINS=http://YOUR_LAN_IP:8081
+
+# Local Python runs may load this file; Docker Compose uses the repo-root `.env` for ${SMTP_*} → be0.
+# Password reset email (same SMTP block as the `.env.example` beside docker-compose for the dev stack).
+# OTP + reset use src/auth_mail.py: set SMTP_* for Option A or AUTH_MAIL_LOG_ONLY=1 locally.
+# AUTH_MAIL_LOG_ONLY=1
+# AUTH_PUBLIC_WEB_ORIGIN=http://localhost:8081
+# SMTP_HOST=smtp.example.com
+# SMTP_PORT=587
+# SMTP_USER=
+# SMTP_PASSWORD=
+# AUTH_MAIL_FROM=noreply@example.com
+# SMTP_USE_TLS=1
@@ -0,0 +1,223 @@
+# Chat Assistant Module
+
+## Overview
+
+The Chat Assistant module provides a conversational AI interface for answering policy and compliance questions using Ollama.
+
+## Architecture
+
+### Backend (`be0/src/chat_assistant.py`)
+
+The `ChatAssistant` class provides:
+- **Chat functionality**: Conversational AI for policy questions
+- **Content verification**: Verify content against compliance requirements
+- **Policy Q&A**: Answer questions about policies and compliance
+
+### Frontend (`fe0/src/features/chat/`)
+
+The frontend chat feature includes:
+- **Service layer**: API communication with backend
+- **React hooks**: Easy-to-use hooks for chat functionality
+- **Type definitions**: TypeScript types for type safety
+
+## API Endpoints
+
+### 1. Chat Endpoint
+```
+POST /api/v1/chat
+```
+
+**Request Body:**
+```json
+{
+  "message": "What are ISO 27001 requirements?",
+  "conversation_history": [
+    {
+      "role": "user",
+      "content": "Previous message"
+    },
+    {
+      "role": "assistant",
+      "content": "Previous response"
+    }
+  ],
+  "context": "Optional context about policies"
+}
+```
+
+**Response:**
+```json
+{
+  "message": "ISO 27001 is an information security management system...",
+  "model": "gemma3:27b",
+  "tokens_used": 150
+}
+```
+
+### 2. Verify Content Endpoint
+```
+POST /api/v1/chat/verify
+```
+
+**Form Data:**
+- `field_name`: Name of the field being verified
+- `content`: Content to verify
+- `verification_criteria`: (Optional) Specific criteria to check
+
+**Response:**
+```json
+{
+  "message": "The content meets compliance requirements...",
+  "model": "gemma3:27b",
+  "tokens_used": 200
+}
+```
+
+### 3. Policy Question Endpoint
+```
+POST /api/v1/chat/question
+```
+
+**Form Data:**
+- `question`: The user's question
+- `policy_context`: (Optional) Context about specific policies
+
+**Response:**
+```json
+{
+  "message": "Answer to the policy question...",
+  "model": "gemma3:27b",
+  "tokens_used": 180
+}
+```
+
+## Features
+
+### 1. Conversational Context
+- Maintains conversation history for context-aware responses
+- Keeps last 10 messages for context
+- System prompt guides the assistant's behavior
+
+### 2. Policy Expertise
+- Specialized in IT governance and compliance
+- Knowledgeable about ISO 27001, NIST, GDPR, etc.
+- Provides accurate, actionable advice
+
+### 3. Content Verification
+- Analyzes content against compliance requirements
+- Provides detailed feedback
+- Suggests improvements
+
+## Usage
+
+### Backend
+
+```python
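+# ChatRequest is used below; this assumes it is exported by chat_assistant — adjust the import if it lives elsewhere.
+from src.chat_assistant import ChatRequest, get_chat_assistant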
+
+# Get chat assistant instance
+assistant = get_chat_assistant()
+
+# Chat
+request = ChatRequest(
+    message="What is ISO 27001?",
+    context="IT governance"
+)
+response = await assistant.chat(request)
+
+# Verify content
+response = await assistant.verify_content(
+    field_name="Project Description",
+    content="Our project implements security controls..."
+)
+```
+
+### Frontend
+
+```typescript
+import { useChat } from '@/features/chat/hooks/useChat';
+
+const { sendMessage, verifyContent, isLoading } = useChat();
+
+// Send a message
+const response = await sendMessage(
+  "What are compliance requirements?",
+  conversationHistory, // Optional
+  "ISO 27001 context"   // Optional
+);
+
+// Verify content
+const verification = await verifyContent(
+  "Project Name",
+  "Project content to verify"
+);
+```
+
+## Configuration
+
+### Model Selection
+
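+The default model is `gemma3:27b`. (The Chat Assistant Troubleshooting Guide reports that the code was later switched to `gemma3:270M` to match the entrypoint script; check `chat_assistant.py` for the current default.) To change it: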
+
+```python
+# In chat_assistant.py
+assistant = ChatAssistant(model_name="your-model-name")
+```
+
+### System Prompt
+
+The system prompt can be customized in the `ChatAssistant.__init__` method to change the assistant's behavior and expertise.
+
+## Logging
+
+All chat interactions are logged to:
+- `be0/logs/ChatAssistant.log`
+
+This helps with debugging and monitoring.
+
+## Error Handling
+
+The module includes comprehensive error handling:
+- Catches and logs all exceptions
+- Returns user-friendly error messages
+- Raises HTTPException for API errors
+
+## Testing
+
+To test the chat assistant:
+
+1. **Start the backend:**
+   ```bash
+   cd be0
+   docker-compose up be0
+   ```
+
+2. **Test via API:**
+   ```bash
+   curl -X POST http://localhost:4402/api/v1/chat \
+     -H "Content-Type: application/json" \
+     -d '{"message": "What is ISO 27001?"}'
+   ```
+
+3. **Test via Frontend:**
+   - Open the Dashboard
+   - Use the ChatAssistant component
+   - Ask questions or verify content
+
+## Integration
+
+The ChatAssistant is integrated with:
+- **ChatAssistant.tsx**: React component in the Dashboard
+- **useChat hook**: React hook for chat functionality
+- **chatService**: API service layer
+
+## Future Enhancements
+
+Potential improvements:
+1. Streaming responses for real-time text generation
+2. Multi-turn conversation management
+3. Document context injection
+4. Voice input/output
+5. Response rating and feedback
+6. Conversation export
+7. Custom model fine-tuning
@@ -0,0 +1,34 @@
+FROM python:3.11
+
+# All build steps and the runtime process operate from /app.
+WORKDIR /app
+
+# System packages first: this layer depends on nothing from the build context,
+# so it stays cached when only requirements.txt or the source tree changes.
+# NOTE(review): python3-pip is probably redundant (the python base image already
+# ships pip); kept to avoid changing the image contents.
+RUN apt-get update && apt-get install -y --no-install-recommends \
+    zstd \
+    curl \
+    git \
+    build-essential \
+    python3-pip \
+    libreoffice-writer-nogui \
+    && rm -rf /var/lib/apt/lists/*
+
+# Ollama is not installed in this image (entrypoint.sh skips it when the binary is absent).
+# RUN curl -fsSL https://ollama.com/install.sh | sh
+
+RUN pip install --no-cache-dir --upgrade pip
+
+# Copy only the manifest before installing, so the dependency layers are rebuilt
+# when requirements.txt changes but not on every source edit.
+COPY ./requirements.txt /app/
+RUN pip install --no-cache-dir -r requirements.txt
+RUN pip install --no-cache-dir nltk
+# Avoid runtime GitHub downloads (slow/hanging in some networks) before Uvicorn starts.
+RUN python3 -m nltk.downloader punkt punkt_tab stopwords averaged_perceptron_tagger_eng wordnet
+
+# Application source last: it changes most often.
+COPY . /app/
+
+# Port the API server listens on (uvicorn --port 4402 in entrypoint.sh).
+EXPOSE 4402
+ENTRYPOINT ["/app/entrypoint.sh"]
@@ -0,0 +1,172 @@
+# Governance Layer Status in be0
+
+## Current State
+
+### ✅ What EXISTS (Current Implementation)
+
+The current `be0` codebase has:
+
+1. **Basic Workflow System** (`src/domain/entities/workflow.py`, `src/application/services/workflow_service.py`)
+   - SDLC/RM Integration workflow
+   - Phase-based progression
+   - Task/checklist management
+   - **Location**: `be0/src/domain/entities/workflow.py`
+
+2. **Compliance Verification** (`src/compliance_verifier.py`)
+   - Ollama-based compliance checking
+   - Text generation and similarity analysis
+   - **Location**: `be0/src/compliance_verifier.py`
+
+3. **Chat Assistant** (`src/chat_assistant.py`)
+   - Policy Q&A functionality
+   - Content verification
+   - **Location**: `be0/src/chat_assistant.py`
+
+4. **Architecture Foundation**
+   - Domain/Application/Infrastructure layers
+   - Repository pattern
+   - API routes structure
+   - **Location**: `be0/src/domain/`, `be0/src/application/`, `be0/src/api/`
+
+---
+
+## ❌ What's MISSING (Governance Layer for Initiatives)
+
+The **Grassroots Initiative Recognition System** governance layer has **NOT been implemented yet**. 
+
+### Missing Components:
+
+#### 1. **Initiative Management**
+- ❌ Initiative entity (initiative_id, group_type, status, etc.)
+- ❌ Author management (contribution percentages, lead author logic)
+- ❌ Unit/Appraisal Team entities
+- **Should be in**: `be0/src/domain/entities/initiative.py`
+
+#### 2. **Business Rules Engine**
+- ❌ Novelty checker (duplicate detection)
+- ❌ Scoring algorithm (Group 01 dual/triple reviewer)
+- ❌ Auto-classification (Group 02)
+- ❌ Author contribution validator
+- **Should be in**: `be0/src/domain/rules/` or `be0/src/application/rules/`
+
+#### 3. **Workflow State Machine**
+- ❌ Initiative state transitions (DRAFT → SUBMITTED → UNIT_REVIEW → etc.)
+- ❌ Deadline enforcement
+- ❌ SLA tracking
+- **Should be in**: `be0/src/application/state_machine.py` or `be0/src/domain/workflows/initiative_workflow.py`
+
+#### 4. **Review Management**
+- ❌ Review assignment logic
+- ❌ Blind review enforcement
+- ❌ Score conflict detection
+- ❌ Reviewer assignment service
+- **Should be in**: `be0/src/application/services/review_service.py`
+
+#### 5. **Document Management**
+- ❌ Form templates (Form 01, 03, 05, 06)
+- ❌ Document versioning
+- ❌ File storage integration
+- **Should be in**: `be0/src/infrastructure/storage/`
+
+#### 6. **API Endpoints**
+- ❌ `/api/v1/initiatives` (CRUD)
+- ❌ `/api/v1/initiatives/{id}/submit`
+- ❌ `/api/v1/initiatives/{id}/reviews`
+- ❌ `/api/v1/reviews/{review_id}/score`
+- ❌ `/api/v1/initiatives/{id}/appeal`
+- **Should be in**: `be0/src/api/routes/initiatives.py`
+
+---
+
+## Recommended Structure for Governance Layer
+
+```
+be0/src/
+├── domain/
+│   ├── entities/
+│   │   ├── initiative.py          # ❌ MISSING
+│   │   ├── author.py              # ❌ MISSING
+│   │   ├── review.py              # ❌ MISSING
+│   │   ├── unit.py                # ❌ MISSING
+│   │   └── appraisal_team.py      # ❌ MISSING
+│   ├── rules/
+│   │   ├── novelty_checker.py     # ❌ MISSING
+│   │   ├── scoring_engine.py      # ❌ MISSING
+│   │   ├── duplicate_detector.py  # ❌ MISSING
+│   │   └── classification_engine.py # ❌ MISSING
+│   └── workflows/
+│       └── initiative_workflow.py  # ❌ MISSING
+├── application/
+│   ├── services/
+│   │   ├── initiative_service.py   # ❌ MISSING
+│   │   ├── review_service.py       # ❌ MISSING
+│   │   ├── notification_service.py # ❌ MISSING
+│   │   └── deadline_service.py    # ❌ MISSING
+│   └── state_machine.py            # ❌ MISSING
+├── infrastructure/
+│   ├── storage/
+│   │   └── file_storage.py         # ❌ MISSING
+│   └── database/
+│       └── models.py               # ❌ MISSING (SQLAlchemy models)
+└── api/
+    └── routes/
+        ├── initiatives.py          # ❌ MISSING
+        ├── reviews.py              # ❌ MISSING
+        └── reports.py              # ❌ MISSING
+```
+
+---
+
+## What to Build Next
+
+Based on the simplified tech stack (layered architecture, FastAPI, PostgreSQL), the recommended implementation order is:
+
+### Phase 1: Core Entities & Database
+1. Create database models (PostgreSQL)
+2. Create domain entities (Initiative, Author, Review, etc.)
+3. Create repository interfaces
+
+### Phase 2: Business Rules
+1. Novelty checker (using PostgreSQL pg_trgm)
+2. Scoring engine
+3. Auto-classification logic
+
+### Phase 3: Workflow
+1. State machine implementation
+2. Transition rules
+3. Deadline tracking
+
+### Phase 4: API & Services
+1. Initiative service
+2. Review service
+3. API endpoints
+4. Document upload
+
+---
+
+## Current vs. Required
+
+| Component | Current | Required | Status |
+|-----------|---------|----------|--------|
+| Workflow (SDLC) | ✅ | ✅ | Implemented |
+| Initiative Management | ❌ | ✅ | **Missing** |
+| Business Rules | ❌ | ✅ | **Missing** |
+| Review System | ❌ | ✅ | **Missing** |
+| State Machine | ❌ | ✅ | **Missing** |
+| Document Storage | ❌ | ✅ | **Missing** |
+| Scoring Engine | ❌ | ✅ | **Missing** |
+
+---
+
+## Next Steps
+
+To implement the governance layer:
+
+1. **Start with database schema** - Create PostgreSQL tables for initiatives, authors, reviews
+2. **Create domain entities** - Python classes for Initiative, Author, Review
+3. **Implement business rules** - Novelty checker, scoring engine
+4. **Build state machine** - Workflow transitions
+5. **Create API endpoints** - RESTful APIs for frontend
+6. **Add document storage** - Local filesystem integration
+
+The foundation (layered architecture, FastAPI, PostgreSQL) is already in place - you just need to build the governance-specific components on top of it.
@@ -0,0 +1,150 @@
+# Chat Assistant Troubleshooting Guide
+
+## Common Errors and Solutions
+
+### Error: 500 Internal Server Error
+
+This usually indicates one of the following issues:
+
+#### 1. Ollama Not Running
+
+**Symptoms:**
+- 500 error on `/api/v1/chat`
+- Error message mentions "connection" or "refused"
+
+**Solution:**
+```bash
+# Check if Ollama is running in the container
+docker exec be0 ps aux | grep ollama
+
+# If not running, restart the container
+docker-compose restart be0
+
+# Or start Ollama manually
+docker exec be0 ollama serve &
+```
+
+#### 2. Model Not Available
+
+**Symptoms:**
+- Error mentions "model not found"
+- Model name mismatch
+
+**Solution:**
+```bash
+# Check available models
+docker exec be0 ollama list
+
+# Pull the required model
+docker exec be0 ollama pull gemma3:270M
+
+# Verify model is available
+docker exec be0 ollama list | grep gemma3
+```
+
+#### 3. Model Name Mismatch
+
+**Issue:** Code uses `gemma3:27b` but entrypoint pulls `gemma3:270M`
+
+**Solution:**
+The code has been updated to use `gemma3:270M` to match the entrypoint script.
+
+#### 4. Network Connectivity
+
+**Symptoms:**
+- Connection refused errors
+- Timeout errors
+
+**Solution:**
+```bash
+# Check if Ollama is accessible from within the container
+docker exec be0 curl http://localhost:11434/api/tags
+
+# Check Ollama service status
+docker exec be0 ollama list
+```
+
+## Diagnostic Endpoints
+
+### Health Check
+```bash
+curl http://localhost:4402/health
+```
+
+This will show:
+- Overall service status
+- Ollama connection status
+- Available models
+
+### Test Ollama Directly
+```bash
+# From inside the container
+docker exec be0 ollama run gemma3:270M "Hello"
+```
+
+## Debugging Steps
+
+1. **Check Backend Logs:**
+   ```bash
+   docker-compose logs be0 | tail -50
+   ```
+
+2. **Check Chat Assistant Logs:**
+   ```bash
+   tail -f be0/logs/ChatAssistant.log
+   ```
+
+3. **Test API Endpoint:**
+   ```bash
+   curl -X POST http://localhost:4402/api/v1/chat \
+     -H "Content-Type: application/json" \
+     -d '{"message": "Hello"}'
+   ```
+
+4. **Verify Ollama Service:**
+   ```bash
+   docker exec be0 ollama list
+   docker exec be0 curl http://localhost:11434/api/tags
+   ```
+
+## Common Fixes
+
+### Fix 1: Restart Ollama Service
+```bash
+docker exec be0 pkill ollama
+docker exec be0 ollama serve &
+sleep 2
+docker exec be0 ollama list
+```
+
+### Fix 2: Pull Missing Model
+```bash
+docker exec be0 ollama pull gemma3:270M
+```
+
+### Fix 3: Restart Container
+```bash
+docker-compose restart be0
+```
+
+### Fix 4: Rebuild Container
+```bash
+docker-compose down
+docker-compose build be0
+docker-compose up be0
+```
+
+## Expected Behavior
+
+When working correctly:
+1. Health endpoint shows Ollama as "connected"
+2. Available models list includes `gemma3:270M`
+3. Chat endpoint returns 200 with a response
+4. Logs show successful message processing
+
+## Still Having Issues?
+
+1. Check the full error in logs: `docker-compose logs be0`
+2. Verify Ollama is running: `docker exec be0 ps aux | grep ollama`
+3. Test Ollama directly: `docker exec be0 ollama run gemma3:270M "test"`
+4. Check model availability: `docker exec be0 ollama list`
@@ -0,0 +1,46 @@
+#!/bin/bash
+# be0 container entrypoint: optional Ollama, dependency sync, DB migrations, then Uvicorn.
+
+if ! command -v ollama >/dev/null 2>&1; then
+  echo "Ollama not installed in this image; skipping."
+else
+  echo "Starting Ollama server..."
+  ollama serve &
+  sleep 1
+fi
+
+# Model pulls are currently disabled; kept for reference.
+# if ! ollama list | grep -q "qwen2.5:3b"; then
+#     echo "Model qwen2.5:3b not found. Pulling..."
+#     ollama pull qwen2.5:3b
+# else
+#     echo "Model qwen2.5:3b already exists. Skipping pull."
+# fi
+# if ! ollama list | grep -q "embeddinggemma:300m"; then
+#     echo "Model embeddinggemma:300m not found. Pulling..."
+#     ollama pull embeddinggemma:300m
+# else
+#     echo "Model embeddinggemma:300m already exists. Skipping pull."
+# fi
+
+# NLTK corpora are installed when the image is built (see Dockerfile).
+# A bind mount can replace /app, so the image's site-packages may lag behind the
+# mounted requirements.txt; reinstall from it and abort startup if that fails.
+if [ -f /app/requirements.txt ]; then
+  echo "Installing/updating Python deps from mounted /app/requirements.txt..."
+  if ! pip install --no-cache-dir -r /app/requirements.txt; then
+    echo "ERROR: pip install -r /app/requirements.txt failed; fix deps and restart be0."
+    exit 1
+  fi
+fi
+
+# Migrations are best-effort: a failure is reported but does not stop the API from starting.
+echo "Applying idempotent initiative DB migrations (008–014 incl. registration_otp_codes) if needed..."
+if ! python /app/scripts/apply_initiative_migrations.py; then
+  echo "WARNING: apply_initiative_migrations exited non-zero — check be0 logs (API may return 503 for evidence/artifacts until DB is fixed)."
+fi
+
+echo "Starting FastAPI..."
+# Build the argument list once; --reload is appended only when UVICORN_RELOAD=1.
+uvicorn_args=(main:app --host 0.0.0.0 --port 4402)
+[ "${UVICORN_RELOAD:-0}" = "1" ] && uvicorn_args+=(--reload)
+exec uvicorn "${uvicorn_args[@]}"
@@ -0,0 +1,251 @@
+-- Initiative Recognition System — PostgreSQL schema (architecture_plan.md §4)
+-- Table order respects FKs (units before users).
+
+-- citext provides the case-insensitive CITEXT type used by users.email.
+CREATE EXTENSION IF NOT EXISTS citext;
+
+-- =========  ENUMS  =========
+-- CREATE TYPE has no IF NOT EXISTS form, so each enum is created inside a DO block
+-- that swallows duplicate_object; re-running this file leaves existing types untouched.
+
+-- Roles a user can hold (see user_roles.role).
+DO $$ BEGIN
+  CREATE TYPE user_role AS ENUM ('applicant','council_member','editor','admin','viewer');
+EXCEPTION WHEN duplicate_object THEN NULL;
+END $$;
+
+-- Classification of an initiative (applications.initiative_classification).
+DO $$ BEGIN
+  CREATE TYPE initiative_class AS ENUM ('technical','research','textbook');
+EXCEPTION WHEN duplicate_object THEN NULL;
+END $$;
+
+-- Kind of research evidence (applications.research_evidence_kind).
+DO $$ BEGIN
+  CREATE TYPE research_evidence AS ENUM ('international','domestic','poster');
+EXCEPTION WHEN duplicate_object THEN NULL;
+END $$;
+
+-- Qualitative level used by evaluations.novelty_level and evaluations.effectiveness_level.
+DO $$ BEGIN
+  CREATE TYPE eval_level AS ENUM ('high','medium','low');
+EXCEPTION WHEN duplicate_object THEN NULL;
+END $$;
+
+-- Lifecycle status shared by initiatives.status and evaluations.status.
+DO $$ BEGIN
+  CREATE TYPE submission_status AS ENUM ('draft','submitted','under_review','approved','rejected');
+EXCEPTION WHEN duplicate_object THEN NULL;
+END $$;
+
+-- Recognition tier stored in initiatives.recognition_tier (nullable there).
+DO $$ BEGIN
+  CREATE TYPE recognition_tier AS ENUM ('excellent','good');
+EXCEPTION WHEN duplicate_object THEN NULL;
+END $$;
+
+-- =========  IDENTITY  =========
+-- NOTE(review): gen_random_uuid() is built into PostgreSQL 13+; older servers need the
+-- pgcrypto extension, which this file does not create — confirm the target server version.
+
+-- Organisational units; parent_id references units itself, so units can form a hierarchy.
+CREATE TABLE IF NOT EXISTS units (
+  id        UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  name      TEXT NOT NULL,
+  parent_id UUID REFERENCES units(id),
+  address   TEXT
+);
+
+-- User accounts. email is CITEXT, so its UNIQUE constraint compares case-insensitively.
+CREATE TABLE IF NOT EXISTS users (
+  id              UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  email           CITEXT UNIQUE NOT NULL,
+  password_hash   TEXT NOT NULL,
+  full_name       TEXT NOT NULL,
+  phone           TEXT,
+  unit_id         UUID REFERENCES units(id),
+  is_active       BOOLEAN NOT NULL DEFAULT TRUE,
+  created_at      TIMESTAMPTZ NOT NULL DEFAULT now(),
+  updated_at      TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+
+-- Role assignments. The composite primary key lets a user hold several roles,
+-- each at most once; rows are removed together with the user (ON DELETE CASCADE).
+CREATE TABLE IF NOT EXISTS user_roles (
+  user_id UUID NOT NULL REFERENCES users(id) ON DELETE CASCADE,
+  role    user_role NOT NULL,
+  PRIMARY KEY (user_id, role)
+);
+
+-- System user for anonymous draft saves (no login yet)
+-- The id is a fixed UUID so the row can be referenced by a known value.
+-- password_hash '-' is a placeholder (presumably never a valid hash — verify against the auth code).
+-- ON CONFLICT (email) makes the insert a no-op when that email already exists; a clash on
+-- id alone (same UUID, different email) would still raise.
+INSERT INTO users (id, email, password_hash, full_name)
+VALUES (
+  '00000000-0000-4000-8000-000000000001',
+  'system@draft.local',
+  '-',
+  'System (draft owner)'
+)
+ON CONFLICT (email) DO NOTHING;
+
+-- =========  CASE / INITIATIVE ROOT  =========
+-- Root row per initiative; the detail tables in this file reference it through
+-- initiative_id with ON DELETE CASCADE.
+CREATE TABLE IF NOT EXISTS initiatives (
+  id              UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  case_code       TEXT UNIQUE NOT NULL,
+  -- No ON DELETE action: a user who still owns initiatives cannot be deleted.
+  owner_id        UUID NOT NULL REFERENCES users(id),
+  status          submission_status NOT NULL DEFAULT 'draft',
+  recognition_tier recognition_tier,
+  submitted_at    TIMESTAMPTZ,
+  created_at      TIMESTAMPTZ NOT NULL DEFAULT now(),
+  updated_at      TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+-- Composite index for lookups by owner, optionally narrowed by status.
+CREATE INDEX IF NOT EXISTS idx_initiatives_owner_status ON initiatives(owner_id, status);
+
+-- =========  DRAFT SNAPSHOTS  =========
+-- Draft rows hold a JSONB payload and a version counter (starting at 1) per initiative.
+-- initiative_id is indexed but not unique, so an initiative may have several draft rows.
+CREATE TABLE IF NOT EXISTS drafts (
+  id              UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  draft_code      TEXT UNIQUE NOT NULL,
+  initiative_id   UUID NOT NULL REFERENCES initiatives(id) ON DELETE CASCADE,
+  payload         JSONB NOT NULL,
+  version         INTEGER NOT NULL DEFAULT 1,
+  updated_at      TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+CREATE INDEX IF NOT EXISTS idx_drafts_initiative ON drafts(initiative_id);
+
+-- =========  APPLICATION FORM (Vietnamese: Đơn)  =========
+-- One row per initiative: initiative_id is both the primary key and the FK.
+CREATE TABLE IF NOT EXISTS applications (
+  initiative_id              UUID PRIMARY KEY REFERENCES initiatives(id) ON DELETE CASCADE,
+  initiative_name            TEXT NOT NULL,
+  investor_name              TEXT,
+  application_field          TEXT,
+  first_apply_date           DATE,
+  initiative_classification  initiative_class,
+  research_evidence_kind     research_evidence,
+  international_journal_decl TEXT,
+  content_summary            TEXT,
+  confidential_info          TEXT,
+  conditions                 TEXT,
+  author_evaluation          TEXT,
+  trial_evaluation           TEXT,
+  -- Submission date is stored as three separate nullable parts.
+  submission_day             SMALLINT,
+  submission_month           SMALLINT,
+  submission_year            SMALLINT,
+  honesty_confirmed          BOOLEAN NOT NULL DEFAULT FALSE,
+  -- first_apply_date, when set, must lie in 2025-04-15 .. 2026-04-15 (inclusive).
+  -- NOTE(review): the window is hard-coded — presumably one recognition cycle; a later
+  -- cycle would need a migration to change this constraint.
+  CONSTRAINT chk_first_apply_window
+     CHECK (first_apply_date IS NULL
+            OR first_apply_date BETWEEN DATE '2025-04-15' AND DATE '2026-04-15')
+);
+
+-- Authors of an initiative. user_id is optional, so an author need not have an account.
+-- Each contribution_percent is limited to 0..100; nothing here enforces that the
+-- percentages of one initiative add up to 100.
+CREATE TABLE IF NOT EXISTS authors (
+  id                   UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  initiative_id        UUID NOT NULL REFERENCES initiatives(id) ON DELETE CASCADE,
+  user_id              UUID REFERENCES users(id),
+  ordinal              SMALLINT NOT NULL,
+  full_name            TEXT NOT NULL,
+  dob                  DATE,
+  workplace            TEXT,
+  title                TEXT,
+  qualification        TEXT,
+  contribution_percent NUMERIC(5,2) NOT NULL,
+  is_representative    BOOLEAN NOT NULL DEFAULT FALSE,
+  CHECK (contribution_percent >= 0 AND contribution_percent <= 100)
+);
+-- Partial unique index: at most one author per initiative may have is_representative = TRUE.
+CREATE UNIQUE INDEX IF NOT EXISTS uq_authors_repr ON authors(initiative_id) WHERE is_representative;
+
+-- Supporting staff listed on an initiative; every descriptive column is optional.
+CREATE TABLE IF NOT EXISTS support_staff (
+  id              UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  initiative_id   UUID NOT NULL REFERENCES initiatives(id) ON DELETE CASCADE,
+  full_name       TEXT,
+  dob             DATE,
+  workplace       TEXT,
+  title           TEXT,
+  qualification   TEXT,
+  support_content TEXT
+);
+
+-- Uploaded evidence files. kind is restricted to the same three labels as the
+-- initiative_class enum, but is stored as TEXT with a CHECK.
+CREATE TABLE IF NOT EXISTS evidence_files (
+  id              UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  initiative_id   UUID NOT NULL REFERENCES initiatives(id) ON DELETE CASCADE,
+  kind            TEXT NOT NULL CHECK (kind IN ('textbook','research','technical')),
+  storage_uri     TEXT NOT NULL,
+  original_name   TEXT NOT NULL,
+  mime_type       TEXT NOT NULL DEFAULT 'application/pdf',
+  byte_size       BIGINT NOT NULL,
+  sha256          CHAR(64) NOT NULL,  -- presumably the hex digest (64 chars) — confirm with the uploader
+  uploaded_by     UUID NOT NULL REFERENCES users(id),
+  uploaded_at     TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+-- At most one evidence file per (initiative, kind).
+CREATE UNIQUE INDEX IF NOT EXISTS uq_evidence_kind ON evidence_files(initiative_id, kind);
+
+-- =========  REPORT (Vietnamese: Báo cáo)  =========
+-- One report per initiative (initiative_id is the primary key).
+CREATE TABLE IF NOT EXISTS reports (
+  initiative_id        UUID PRIMARY KEY REFERENCES initiatives(id) ON DELETE CASCADE,
+  introduction         TEXT,
+  representative_phone TEXT,
+  representative_email TEXT,
+  current_status       TEXT,
+  purpose              TEXT,
+  implementation_steps TEXT,
+  first_applied_unit   TEXT,
+  achieved_result      TEXT,
+  novelty              TEXT,
+  effectiveness        JSONB NOT NULL DEFAULT '{}'::jsonb,  -- structured; defaults to an empty object
+  submission_date      DATE
+);
+
+-- Units where an initiative was trialled; several rows per initiative are allowed.
+CREATE TABLE IF NOT EXISTS trial_units (
+  id              UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  initiative_id   UUID NOT NULL REFERENCES initiatives(id) ON DELETE CASCADE,
+  name            TEXT NOT NULL,
+  address         TEXT,
+  field           TEXT,
+  ordinal         SMALLINT
+);
+
+-- =========  CONTRIBUTION CONFIRMATION  =========
+-- One confirmation per initiative (initiative_id is the primary key).
+-- Note: submission_date is TIMESTAMPTZ here, whereas reports.submission_date is DATE.
+CREATE TABLE IF NOT EXISTS contributions (
+  initiative_id               UUID PRIMARY KEY REFERENCES initiatives(id) ON DELETE CASCADE,
+  main_author                 TEXT NOT NULL,
+  position                    TEXT,
+  representative_percent      NUMERIC(5,2),
+  submission_date             TIMESTAMPTZ,
+  digital_signature_confirmed BOOLEAN NOT NULL DEFAULT FALSE
+);
+
+-- Participants named on a contribution confirmation. Unlike authors.contribution_percent,
+-- the percentage here is nullable and has no range CHECK.
+CREATE TABLE IF NOT EXISTS contribution_participants (
+  id                   UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  initiative_id        UUID NOT NULL REFERENCES initiatives(id) ON DELETE CASCADE,
+  full_name            TEXT,
+  work_unit            TEXT,
+  contribution_percent NUMERIC(5,2)
+);
+
+-- =========  EVALUATION SHEET (Vietnamese: Phiếu đánh giá)  =========
+-- One evaluation per (initiative, council member), enforced by the UNIQUE constraint below.
+CREATE TABLE IF NOT EXISTS evaluations (
+  id                    UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  initiative_id         UUID NOT NULL REFERENCES initiatives(id) ON DELETE CASCADE,
+  council_member_id     UUID NOT NULL REFERENCES users(id),
+  position              TEXT,
+  evaluation_date       DATE NOT NULL,
+  novelty_level         eval_level,
+  novelty_score         SMALLINT,
+  novelty_comment       TEXT,
+  effectiveness_level   eval_level,
+  effectiveness_score   SMALLINT,
+  effectiveness_comment TEXT,
+  -- Stored generated column: sum of the two scores, with a missing score counted as 0.
+  -- Given the CHECKs below (0..40 and 0..60) the total lies in 0..100.
+  total_score           SMALLINT GENERATED ALWAYS AS
+                        (COALESCE(novelty_score,0) + COALESCE(effectiveness_score,0)) STORED,
+  conclusion            TEXT,
+  status                submission_status NOT NULL DEFAULT 'draft',
+  submitted_at          TIMESTAMPTZ,
+  created_at            TIMESTAMPTZ NOT NULL DEFAULT now(),
+  CHECK (novelty_score       IS NULL OR (novelty_score BETWEEN 0 AND 40)),
+  CHECK (effectiveness_score IS NULL OR (effectiveness_score BETWEEN 0 AND 60)),
+  UNIQUE (initiative_id, council_member_id)
+);
+-- NOTE(review): the UNIQUE constraint's index already leads with initiative_id, so this
+-- separate index is likely redundant — confirm before dropping.
+CREATE INDEX IF NOT EXISTS idx_eval_initiative ON evaluations(initiative_id);
+
+-- =========  ADMIN VERIFY  =========
+-- Record of a verification of one named field of an initiative: who verified it, when,
+-- and a hash of the content.
+CREATE TABLE IF NOT EXISTS verifications (
+  id            UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  initiative_id UUID NOT NULL REFERENCES initiatives(id) ON DELETE CASCADE,
+  field_name    TEXT NOT NULL,
+  content_hash  CHAR(64) NOT NULL,  -- presumably a SHA-256 hex digest, like evidence_files.sha256 — confirm
+  verified_by   UUID NOT NULL REFERENCES users(id),
+  verified_at   TIMESTAMPTZ NOT NULL DEFAULT now(),
+  result        TEXT
+);
+
+-- =========  AUDIT TRAIL  =========
+-- Audit rows. entity/entity_id identify the affected row by table-like name and UUID;
+-- entity_id carries no foreign key, so it can point at any table.
+-- actor_id is nullable, so an entry can be recorded without a user.
+CREATE TABLE IF NOT EXISTS audit_log (
+  id          BIGSERIAL PRIMARY KEY,
+  actor_id    UUID REFERENCES users(id),
+  action      TEXT NOT NULL,
+  entity      TEXT NOT NULL,
+  entity_id   UUID NOT NULL,
+  diff        JSONB,
+  occurred_at TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+-- Supports fetching the history of one entity.
+CREATE INDEX IF NOT EXISTS idx_audit_entity ON audit_log(entity, entity_id);
@@ -0,0 +1,71 @@
+-- Versioned tab payloads + immutable submit snapshots + workflow/taxonomy + artifact registry.
+-- Apply on existing DBs: psql "$INITIATIVE_DATABASE_URL" -f migrations/002_application_storage_extensions.sql
+-- (use sync driver URL, not asyncpg, for psql)
+
+-- =========  DRAFT TAB SNAPSHOTS (fe0: report | application | contribution)  =========
+-- One row per captured tab payload. draft_id is optional and is set to NULL when the
+-- referenced draft is deleted, so snapshots outlive their draft row.
+CREATE TABLE IF NOT EXISTS draft_tab_snapshots (
+  id              UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  initiative_id   UUID NOT NULL REFERENCES initiatives(id) ON DELETE CASCADE,
+  draft_id        UUID REFERENCES drafts(id) ON DELETE SET NULL,
+  tab             TEXT NOT NULL CHECK (tab IN ('report', 'application', 'contribution')),
+  tab_version     INTEGER NOT NULL DEFAULT 1,
+  payload         JSONB NOT NULL DEFAULT '{}'::jsonb,
+  source          TEXT NOT NULL DEFAULT 'autosave',  -- free-form; no CHECK restricts the values
+  captured_at     TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+-- Newest version first within (initiative, tab).
+CREATE INDEX IF NOT EXISTS idx_draft_tab_snapshots_init_tab_ver
+  ON draft_tab_snapshots (initiative_id, tab, tab_version DESC);
+-- Newest snapshots first across all initiatives.
+CREATE INDEX IF NOT EXISTS idx_draft_tab_snapshots_captured
+  ON draft_tab_snapshots (captured_at DESC);
+
+-- =========  SUBMIT SNAPSHOTS (immutable row per successful submit)  =========
+-- Immutability is a convention only: nothing in this DDL (no trigger or rule) prevents
+-- UPDATE/DELETE, so it has to be upheld by the application.
+-- An initiative may have several rows (no uniqueness on initiative_id).
+CREATE TABLE IF NOT EXISTS application_submit_snapshots (
+  id                    UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  initiative_id         UUID NOT NULL REFERENCES initiatives(id) ON DELETE CASCADE,
+  submission_record_id  TEXT NOT NULL,
+  merged_tabs           JSONB NOT NULL DEFAULT '{}'::jsonb,
+  submit_metadata       JSONB NOT NULL DEFAULT '{}'::jsonb,
+  full_pdf_uri          TEXT NOT NULL,
+  captured_at           TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+-- Newest submit first per initiative.
+CREATE INDEX IF NOT EXISTS idx_submit_snapshots_init_time
+  ON application_submit_snapshots (initiative_id, captured_at DESC);
+
+-- =========  WORKFLOW / LIST PROJECTION (council fields)  =========
+-- One row per initiative. review_status is free-form TEXT (no CHECK), defaulting to
+-- 'not_reviewed'; reviewer / supervisor / conference are stored as nullable JSONB.
+CREATE TABLE IF NOT EXISTS application_workflow (
+  initiative_id    UUID PRIMARY KEY REFERENCES initiatives(id) ON DELETE CASCADE,
+  review_status    TEXT NOT NULL DEFAULT 'not_reviewed',
+  review_deadline  DATE,
+  reviewer         JSONB,
+  supervisor       JSONB,
+  conference       JSONB,
+  updated_at       TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+
+-- =========  TAXONOMY (subjectId, groupId, topicType from fe0 ApplicationItem)  =========
+-- One row per initiative. The three ids are NOT NULL TEXT with an empty-string default,
+-- so "unset" is represented by '' rather than NULL.
+CREATE TABLE IF NOT EXISTS application_taxonomy (
+  initiative_id UUID PRIMARY KEY REFERENCES initiatives(id) ON DELETE CASCADE,
+  subject_id    TEXT NOT NULL DEFAULT '',
+  group_id      TEXT NOT NULL DEFAULT '',
+  topic_type    TEXT NOT NULL DEFAULT '',
+  updated_at    TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+
+-- =========  ARTIFACTS (PDF + future abstract/poster URIs; complements evidence_files)  =========
+-- At most one artifact per (initiative, role), enforced by the UNIQUE constraint.
+-- Unlike evidence_files, original_name, byte_size, sha256 and uploaded_by are optional here.
+CREATE TABLE IF NOT EXISTS application_artifacts (
+  id             UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  initiative_id  UUID NOT NULL REFERENCES initiatives(id) ON DELETE CASCADE,
+  role           TEXT NOT NULL CHECK (role IN (
+    'full_pdf', 'abstract', 'poster',
+    'textbook_evidence', 'research_evidence', 'technical_evidence', 'other'
+  )),
+  storage_uri    TEXT NOT NULL,
+  original_name  TEXT,
+  mime_type      TEXT NOT NULL DEFAULT 'application/pdf',
+  byte_size      BIGINT,
+  sha256         CHAR(64),
+  uploaded_by    UUID REFERENCES users(id),
+  uploaded_at    TIMESTAMPTZ NOT NULL DEFAULT now(),
+  UNIQUE (initiative_id, role)
+);
+-- NOTE(review): the UNIQUE (initiative_id, role) index already leads with initiative_id,
+-- so this index is likely redundant — confirm before dropping.
+CREATE INDEX IF NOT EXISTS idx_application_artifacts_init ON application_artifacts (initiative_id);
@@ -0,0 +1,22 @@
+-- Persist ReviewPanel JSON bundles (templateData + officialBieuMau + full trees)
+-- Apply on existing DBs:
+--   psql "$INITIATIVE_DATABASE_URL" -f migrations/003_review_documents.sql
+
+-- Versioned review documents: each (initiative_id, document_version) pair is unique,
+-- so an initiative can keep several versions side by side.
+-- case_id is plain TEXT with no foreign key.
+CREATE TABLE IF NOT EXISTS application_review_documents (
+  id                 UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  initiative_id      UUID NOT NULL REFERENCES initiatives(id) ON DELETE CASCADE,
+  case_id            TEXT NOT NULL,
+  document_version   INTEGER NOT NULL DEFAULT 1,
+  official_bieu_mau  JSONB NOT NULL DEFAULT '{}'::jsonb,  -- "bieu mau" is Vietnamese for "form template"
+  template_data      JSONB,
+  full_bundle        JSONB,
+  created_by         UUID REFERENCES users(id),
+  created_at         TIMESTAMPTZ NOT NULL DEFAULT now(),
+  UNIQUE (initiative_id, document_version)
+);
+
+-- Newest document first, looked up either by initiative or by case_id.
+CREATE INDEX IF NOT EXISTS idx_review_docs_initiative_time
+  ON application_review_documents (initiative_id, created_at DESC);
+CREATE INDEX IF NOT EXISTS idx_review_docs_case_time
+  ON application_review_documents (case_id, created_at DESC);
+
@@ -0,0 +1,18 @@
+-- Admin-recorded adjudication outcome per initiative (linked to applicant application id API).
+-- One row per initiative; CRUD via /api/applications/{applicationId}/admin-result
+
+-- Admin decision for an initiative. The named UNIQUE constraint on initiative_id limits
+-- the table to one row per initiative; decision is restricted to 'approved' / 'rejected'.
+CREATE TABLE IF NOT EXISTS application_admin_results (
+  id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  initiative_id UUID NOT NULL REFERENCES initiatives(id) ON DELETE CASCADE,
+  decision TEXT NOT NULL CHECK (decision IN ('approved','rejected')),
+  feedback TEXT NOT NULL DEFAULT '',
+  rationale TEXT,
+  created_at TIMESTAMPTZ NOT NULL DEFAULT now(),
+  updated_at TIMESTAMPTZ NOT NULL DEFAULT now(),
+  created_by UUID REFERENCES users(id),
+  updated_by UUID REFERENCES users(id),
+  CONSTRAINT uq_application_admin_results_initiative UNIQUE (initiative_id)
+);
+
+-- NOTE(review): the UNIQUE constraint above already creates an index on initiative_id,
+-- so this index is likely redundant — confirm before dropping.
+CREATE INDEX IF NOT EXISTS idx_application_admin_results_initiative
+  ON application_admin_results(initiative_id);
@@ -0,0 +1,13 @@
+-- Evidence staff review (approve / reject) on application_artifacts — must match be0/src/initiative_db/models.py ApplicationArtifact
+-- New DBs: loaded by docker-compose postgres init (04_...).
+-- Existing DBs: run once, e.g.
+--   docker exec -i initiative-postgres psql -U initiative -d initiatives < be0/migrations/004_evidence_artifact_review.sql
+--   # or: psql "$INITIATIVE_DATABASE_URL" -f be0/migrations/004_evidence_artifact_review.sql
+
+-- Adds nullable review columns; IF NOT EXISTS makes the statement safe to re-run.
+-- review_status is free-form TEXT: no CHECK constraint restricts its values here.
+-- reviewed_by is reset to NULL if the reviewing user is deleted.
+ALTER TABLE application_artifacts
+  ADD COLUMN IF NOT EXISTS review_status TEXT,
+  ADD COLUMN IF NOT EXISTS reviewed_by UUID REFERENCES users (id) ON DELETE SET NULL,
+  ADD COLUMN IF NOT EXISTS reviewed_at TIMESTAMPTZ;
+
+-- Supports filtering an initiative's artifacts by review status.
+CREATE INDEX IF NOT EXISTS idx_application_artifacts_review
+  ON application_artifacts (initiative_id, review_status);
@@ -0,0 +1,26 @@
+-- In-app notifications for applicants (admin adjudication → inbox).
+-- Best-effort insert after PUT/POST admin-result. The full decision text is duplicated into each row for read UX.
+
+CREATE TABLE IF NOT EXISTS user_notifications (
+  id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  recipient_user_id UUID NOT NULL REFERENCES users(id) ON DELETE CASCADE,  -- notifications are removed with the recipient
+  type TEXT NOT NULL CHECK (type IN ('admin_application_decision')),  -- a single allowed value in this migration
+  title TEXT NOT NULL,
+  body TEXT NOT NULL,
+  application_id TEXT NOT NULL,  -- plain text, not a foreign key
+  related_initiative_id UUID REFERENCES initiatives(id) ON DELETE SET NULL,  -- row survives deletion of the initiative
+  source_admin_result_id UUID REFERENCES application_admin_results(id) ON DELETE SET NULL,  -- row survives deletion of the result
+  decision TEXT NOT NULL CHECK (decision IN ('approved','rejected')),
+  merit_category_label TEXT,
+  feedback_text TEXT NOT NULL DEFAULT '',
+  rationale_text TEXT,
+  read_at TIMESTAMPTZ,  -- NULL means unread (see the partial index below)
+  created_at TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+
+CREATE INDEX IF NOT EXISTS user_notifications_inbox_idx  -- inbox of one recipient, newest first
+  ON user_notifications (recipient_user_id, created_at DESC);
+
+CREATE INDEX IF NOT EXISTS user_notifications_unread_idx  -- partial index covering unread rows only
+  ON user_notifications (recipient_user_id)
+  WHERE read_at IS NULL;
@@ -0,0 +1,33 @@
+-- Policy-sourced admin rows: safe to drop when email leaves AUTH_ADMIN_EMAILS (app reconciliation).
+-- Apply on existing DBs:  docker exec -i initiative-postgres psql -U initiative -d initiatives < be0/migrations/007_user_roles_email_policy_admin.sql
+-- Fresh docker-compose init: add this file as docker-entrypoint-initdb.d/07_*.sql
+-- Existing role rows receive admin_from_email_policy = FALSE (the column default) when the column is added.
+ALTER TABLE user_roles ADD COLUMN IF NOT EXISTS admin_from_email_policy BOOLEAN NOT NULL DEFAULT FALSE;
+
+COMMENT ON COLUMN user_roles.admin_from_email_policy IS
+  'TRUE when admin was granted by email allow-list (AUTH_ADMIN_EMAILS). Reconciliation may DELETE this row if the user email is no longer in the list. FALSE preserves manually granted admin (future / exceptional).';
+-- NOTE(review): the DELETE below has no admin_from_email_policy filter and runs on every apply, so it also removes manually granted admins outside this list — confirm that is intended.
+-- One-time cleanup: remove admin for addresses not in the default institutional allow-list
+-- (must match default in auth_api._DEFAULT_POLICY_ADMIN_EMAILS when AUTH_ADMIN_EMAILS is unset).
+DELETE FROM user_roles ur
+USING users u
+WHERE ur.user_id = u.id
+  AND ur.role::text = 'admin'
+  AND lower(u.email::text) NOT IN (
+    'thaontt@ump.edu.vn',
+    'nltanh@ump.edu.vn',
+    'ldbaochau@ump.edu.vn',
+    'htchuong@ump.edu.vn'
+  );
+-- Flag the remaining allow-listed admin rows as policy-sourced (email compared case-insensitively via lower()).
+UPDATE user_roles ur
+SET admin_from_email_policy = TRUE
+FROM users u
+WHERE ur.user_id = u.id
+  AND ur.role::text = 'admin'
+  AND lower(u.email::text) IN (
+    'thaontt@ump.edu.vn',
+    'nltanh@ump.edu.vn',
+    'ldbaochau@ump.edu.vn',
+    'htchuong@ump.edu.vn'
+  );
@@ -0,0 +1,38 @@
+-- Unified append-only audit trail (see assets/docs/audit-log-implementation.md).
+-- Application role should be granted INSERT, SELECT only (configure per deployment).
+-- CREATE TYPE has no IF NOT EXISTS form, so the duplicate_object handler below makes a re-run a no-op.
+DO $$
+BEGIN
+    CREATE TYPE audit_action AS ENUM (
+        'create',
+        'read',
+        'update',
+        'delete',
+        'login',
+        'logout',
+        'login_failed'
+    );
+EXCEPTION
+    WHEN duplicate_object THEN NULL;
+END
+$$;
+
+CREATE TABLE IF NOT EXISTS audit_events (
+    id              BIGSERIAL PRIMARY KEY,
+    occurred_at     TIMESTAMPTZ NOT NULL DEFAULT now(),
+    actor_user_id   UUID REFERENCES users(id) ON DELETE SET NULL,  -- nulled when the user is deleted, the event row stays
+    actor_email     TEXT NOT NULL,  -- plain text copy, not a foreign key
+    actor_role      TEXT NOT NULL,  -- plain text copy, not a foreign key
+    action          audit_action NOT NULL,
+    entity_type     TEXT NOT NULL,
+    entity_id       TEXT,  -- nullable
+    before          JSONB,  -- nullable
+    after           JSONB,  -- nullable
+    metadata        JSONB NOT NULL DEFAULT '{}'::jsonb,
+    request_id      UUID
+);
+
+CREATE INDEX IF NOT EXISTS idx_audit_actor_time   ON audit_events (actor_user_id, occurred_at DESC);
+CREATE INDEX IF NOT EXISTS idx_audit_entity       ON audit_events (entity_type, entity_id, occurred_at DESC);
+CREATE INDEX IF NOT EXISTS idx_audit_action_time  ON audit_events (action, occurred_at DESC);
+CREATE INDEX IF NOT EXISTS idx_audit_metadata_gin ON audit_events USING gin (metadata);
@@ -0,0 +1,35 @@
+-- Backup / canonical storage: official printable DOCX+PDF roles + explicit storage_kind.
+-- Apply: psql "$INITIATIVE_DATABASE_URL" -f migrations/009_backup_artifact_roles_storage_kind.sql
+-- Drop-then-add keeps the role CHECK re-runnable. The full allowed set is the list below.
+ALTER TABLE application_artifacts DROP CONSTRAINT IF EXISTS application_artifacts_role_check;
+ALTER TABLE application_artifacts ADD CONSTRAINT application_artifacts_role_check CHECK (role IN (
+  'full_pdf',
+  'abstract',
+  'poster',
+  'textbook_evidence',
+  'research_evidence',
+  'technical_evidence',
+  'other',
+  'official_form_docx',
+  'official_form_pdf'
+));
+
+ALTER TABLE application_artifacts
+  ADD COLUMN IF NOT EXISTS storage_kind TEXT;
+-- Backfill only rows without a storage_kind. CASE branches are tried top to bottom, so URI prefixes win over role.
+UPDATE application_artifacts SET storage_kind = CASE
+  WHEN storage_uri LIKE 'http://%' OR storage_uri LIKE 'https://%' THEN 'external_url'
+  WHEN storage_uri LIKE '/submitted-initiatives/%' THEN 'filesystem'
+  WHEN role IN ('research_evidence', 'textbook_evidence', 'technical_evidence') THEN 'minio_attachments'
+  ELSE 'minio_exports'
+END
+WHERE storage_kind IS NULL;
+-- The CHECK still allows NULL, so rows inserted without a storage_kind remain valid.
+ALTER TABLE application_artifacts DROP CONSTRAINT IF EXISTS application_artifacts_storage_kind_check;
+ALTER TABLE application_artifacts ADD CONSTRAINT application_artifacts_storage_kind_check
+  CHECK (storage_kind IS NULL OR storage_kind IN (
+    'minio_exports',
+    'minio_attachments',
+    'filesystem',
+    'external_url'
+  ));
@@ -0,0 +1,114 @@
+-- User staff profiles (1:1 with users) — HR / verification workflow
+-- Apply: docker exec -i initiative-postgres psql -U initiative -d initiatives < be0/migrations/010_user_staff_profiles.sql
+-- CREATE TYPE has no IF NOT EXISTS form, so duplicate_object is swallowed to keep this file re-runnable.
+DO $$ BEGIN
+  CREATE TYPE profile_verification_status AS ENUM ('draft', 'pending', 'verified', 'rejected');
+EXCEPTION WHEN duplicate_object THEN NULL;
+END $$;
+-- Lookup table of academic title codes with Vietnamese and English labels.
+CREATE TABLE IF NOT EXISTS academic_titles (
+  code         TEXT PRIMARY KEY,
+  label_vi     TEXT NOT NULL,
+  label_en     TEXT NOT NULL,
+  sort_order   INTEGER NOT NULL DEFAULT 0,
+  active       BOOLEAN NOT NULL DEFAULT TRUE
+);
+-- Seed rows. ON CONFLICT DO NOTHING leaves any row that already exists untouched.
+INSERT INTO academic_titles (code, label_vi, label_en, sort_order) VALUES
+  ('professor', 'Giáo sư', 'Professor', 10),
+  ('associate_professor', 'Phó Giáo sư', 'Associate Professor', 20),
+  ('doctor_sc', 'Tiến sĩ', 'Doctor of Science', 30),
+  ('bsckii', 'BSCKII', 'Specialist level II', 35),
+  ('bscki', 'BSCKI', 'Specialist level I', 36),
+  ('master', 'Thạc sĩ', 'Master', 40),
+  ('doctor_md', 'Bác sĩ', 'Physician', 45),
+  ('pharmacist', 'Dược sĩ', 'Pharmacist', 46),
+  ('bachelor', 'Cử nhân', 'Bachelor', 50),
+  ('other', 'Khác (ghi rõ)', 'Other (specify)', 100)
+ON CONFLICT (code) DO NOTHING;
+
+CREATE TABLE IF NOT EXISTS user_staff_profiles (
+  user_id                       UUID PRIMARY KEY
+                                  REFERENCES users(id) ON DELETE CASCADE,  -- at most one profile per user, removed with the user
+
+  employee_id                   TEXT,
+  academic_title_code           TEXT REFERENCES academic_titles(code),
+  academic_title_other          TEXT,
+  unit_name_freetext            TEXT,
+  job_title                     TEXT,
+
+  profile_verification_status   profile_verification_status
+                                  NOT NULL DEFAULT 'draft',
+  verification_submitted_at     TIMESTAMPTZ,
+  verified_at                   TIMESTAMPTZ,
+  verified_by_user_id           UUID REFERENCES users(id),  -- no ON DELETE action: a verifier referenced here cannot be deleted
+  rejection_reason              TEXT,
+
+  version                       INTEGER NOT NULL DEFAULT 1,  -- presumably an optimistic-lock counter — TODO confirm against the API
+  created_at                    TIMESTAMPTZ NOT NULL DEFAULT now(),
+  updated_at                    TIMESTAMPTZ NOT NULL DEFAULT now(),
+
+  CONSTRAINT employee_id_shape  -- when set: 3 to 32 characters of A-Z, 0-9 or hyphen
+    CHECK (employee_id IS NULL OR employee_id ~ '^[A-Z0-9-]{3,32}$'),
+
+  CONSTRAINT academic_title_other_invariant CHECK (  -- free-text title is required for code 'other' and forbidden otherwise
+    CASE
+      WHEN academic_title_code IS NULL THEN academic_title_other IS NULL
+      WHEN academic_title_code = 'other' THEN
+        academic_title_other IS NOT NULL AND length(trim(academic_title_other)) > 0
+      ELSE academic_title_other IS NULL
+    END
+  ),
+
+  CONSTRAINT verified_requires_metadata CHECK (  -- 'verified' needs both verified_at and verified_by_user_id
+    profile_verification_status <> 'verified'
+    OR (verified_at IS NOT NULL AND verified_by_user_id IS NOT NULL)
+  ),
+
+  CONSTRAINT rejected_requires_reason CHECK (  -- 'rejected' needs a non-blank rejection_reason
+    profile_verification_status <> 'rejected'
+    OR (rejection_reason IS NOT NULL AND length(trim(rejection_reason)) > 0)
+  ),
+
+  CONSTRAINT non_terminal_clears_verification CHECK (  -- 'draft' and 'pending' must carry no verifier metadata
+    profile_verification_status NOT IN ('draft', 'pending')
+    OR (verified_at IS NULL AND verified_by_user_id IS NULL)
+  ),
+
+  CONSTRAINT rejected_clears_verification_metadata CHECK (  -- 'rejected' must carry no verifier metadata either
+    profile_verification_status <> 'rejected'
+    OR (verified_at IS NULL AND verified_by_user_id IS NULL)
+  ),
+
+  CONSTRAINT verified_clears_rejection CHECK (  -- 'verified' must carry no rejection_reason
+    profile_verification_status <> 'verified'
+    OR rejection_reason IS NULL
+  ),
+
+  CONSTRAINT job_title_length CHECK (  -- when set: at most 120 characters
+    job_title IS NULL OR length(job_title) <= 120
+  )
+);
+
+CREATE UNIQUE INDEX IF NOT EXISTS ix_usp_employee_id_unique  -- employee_id is unique when set, any number of NULLs allowed
+  ON user_staff_profiles (employee_id)
+  WHERE employee_id IS NOT NULL;
+
+CREATE INDEX IF NOT EXISTS ix_usp_pending_queue  -- partial index over 'pending' rows ordered by submission time
+  ON user_staff_profiles (verification_submitted_at)
+  WHERE profile_verification_status = 'pending';
+
+CREATE INDEX IF NOT EXISTS ix_usp_verifier_activity  -- rows verified by one user, newest verified_at first
+  ON user_staff_profiles (verified_by_user_id, verified_at DESC)
+  WHERE verified_by_user_id IS NOT NULL;
+
+-- Backfill one row per existing user (draft, NULL fields). NOT EXISTS skips users that already have a profile.
+INSERT INTO user_staff_profiles (user_id, profile_verification_status)
+SELECT u.id, 'draft'::profile_verification_status
+FROM users u
+WHERE NOT EXISTS (
+  SELECT 1 FROM user_staff_profiles p WHERE p.user_id = u.id
+);
+
+COMMENT ON TABLE user_staff_profiles IS
+  'Institutional staff profile and verification state; scalars only — no MinIO.';
@@ -0,0 +1,19 @@
+-- Extend / refresh academic_titles for UMP staff profile dropdown (VN labels + BSCK codes).
+-- Apply after 010: psql … -f be0/migrations/011_academic_titles_vn.sql
+-- NOTE(review): the upsert overwrites label_vi, label_en, sort_order and active on every apply, so manual edits to these rows are reset.
+INSERT INTO academic_titles (code, label_vi, label_en, sort_order, active) VALUES
+  ('professor', 'Giáo sư', 'Professor', 10, TRUE),
+  ('associate_professor', 'Phó Giáo sư', 'Associate Professor', 20, TRUE),
+  ('doctor_sc', 'Tiến sĩ', 'Doctor of Science', 30, TRUE),
+  ('bsckii', 'BSCKII', 'Specialist level II', 35, TRUE),
+  ('bscki', 'BSCKI', 'Specialist level I', 36, TRUE),
+  ('master', 'Thạc sĩ', 'Master', 40, TRUE),
+  ('doctor_md', 'Bác sĩ', 'Physician', 45, TRUE),
+  ('pharmacist', 'Dược sĩ', 'Pharmacist', 46, TRUE),
+  ('bachelor', 'Cử nhân', 'Bachelor', 50, TRUE),
+  ('other', 'Khác (ghi rõ)', 'Other (specify)', 100, TRUE)
+ON CONFLICT (code) DO UPDATE SET
+  label_vi = EXCLUDED.label_vi,
+  label_en = EXCLUDED.label_en,
+  sort_order = EXCLUDED.sort_order,
+  active = EXCLUDED.active;
@@ -0,0 +1,19 @@
+-- Password reset tokens + JWT credential invalidation (see auth_api, auth_credential_middleware).
+-- Apply: docker exec -i initiative-postgres psql -U initiative -d initiatives < be0/migrations/012_password_reset.sql
+-- Existing users receive credential_version 0 (the column default) when the column is added.
+ALTER TABLE users ADD COLUMN IF NOT EXISTS credential_version INTEGER NOT NULL DEFAULT 0;
+
+COMMENT ON COLUMN users.credential_version IS
+  'Incremented on password change/reset. JWT ''cv'' claim must match or token is rejected.';
+
+CREATE TABLE IF NOT EXISTS password_reset_tokens (
+  id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  user_id UUID NOT NULL REFERENCES users(id) ON DELETE CASCADE,  -- tokens are removed with the user
+  token_hash TEXT NOT NULL UNIQUE,  -- presumably a digest of the emailed token, not the token itself — confirm in auth_api
+  expires_at TIMESTAMPTZ NOT NULL,
+  used_at TIMESTAMPTZ,  -- nullable, presumably NULL until the token is redeemed — confirm in auth_api
+  created_at TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+
+CREATE INDEX IF NOT EXISTS idx_password_reset_tokens_user_id ON password_reset_tokens(user_id);
+CREATE INDEX IF NOT EXISTS idx_password_reset_tokens_expires_at ON password_reset_tokens(expires_at);
@@ -0,0 +1,21 @@
+-- Email verification before login (see auth_api deliver_email_verification_email).
+-- Apply: docker exec -i initiative-postgres psql -U initiative -d initiatives < be0/migrations/013_email_verification.sql
+-- Safe to re-apply: accounts that predate the column are grandfathered as verified exactly once, through the ADD COLUMN default.
+ALTER TABLE users ADD COLUMN IF NOT EXISTS email_verified BOOLEAN NOT NULL DEFAULT TRUE;
+-- New accounts must start unverified. Only the default changes here, so re-applying never flips pending users to verified.
+ALTER TABLE users ALTER COLUMN email_verified SET DEFAULT FALSE;
+
+COMMENT ON COLUMN users.email_verified IS
+  'FALSE until user confirms institutional inbox via email link; login and API tokens require TRUE.';
+
+CREATE TABLE IF NOT EXISTS email_verification_tokens (
+  id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  user_id UUID NOT NULL REFERENCES users(id) ON DELETE CASCADE,  -- tokens are removed with the user
+  token_hash TEXT NOT NULL UNIQUE,
+  expires_at TIMESTAMPTZ NOT NULL,
+  used_at TIMESTAMPTZ,
+  created_at TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+
+CREATE INDEX IF NOT EXISTS idx_email_verification_tokens_user_id ON email_verification_tokens(user_id);
+CREATE INDEX IF NOT EXISTS idx_email_verification_tokens_expires_at ON email_verification_tokens(expires_at);
@@ -0,0 +1,20 @@
+-- Registration email verification via 6-digit OTP (replaces magic-link issuance on register).
+-- Apply after 013_email_verification.sql:
+--   docker exec -i initiative-postgres psql -U initiative -d initiatives < be0/migrations/014_registration_otp.sql
+
+CREATE TABLE IF NOT EXISTS registration_otp_codes (
+  id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  user_id UUID NOT NULL REFERENCES users(id) ON DELETE CASCADE,  -- codes are removed with the user
+  otp_hash TEXT NOT NULL,  -- not UNIQUE, unlike token_hash in the token tables
+  expires_at TIMESTAMPTZ NOT NULL,
+  failed_attempts INT NOT NULL DEFAULT 0,  -- counter only, any attempt limit is not enforced in the schema
+  used_at TIMESTAMPTZ,  -- NULL marks a pending code (see the partial index below)
+  created_at TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+
+CREATE INDEX IF NOT EXISTS idx_registration_otp_codes_user_pending  -- partial index over pending codes per user
+  ON registration_otp_codes (user_id)
+  WHERE used_at IS NULL;
+
+COMMENT ON TABLE registration_otp_codes IS
+  'Hashed 6-digit OTP for register verification; pending rows deleted when superseded by resend.';
@@ -0,0 +1,24 @@
+-- Admin-managed document templates: a .docx (stored in MinIO bucket initiative-templates)
+-- plus its extracted Jinja placeholder fields. Applicants render a filled PDF by template id.
+-- Apply after 014_registration_otp.sql:
+--   docker exec -i initiative-postgres psql -U initiative -d initiatives < be0/migrations/015_document_templates.sql
+
+CREATE TABLE IF NOT EXISTS document_templates (
+  id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  name TEXT NOT NULL,  -- no uniqueness constraint on the name
+  description TEXT,
+  storage_key TEXT NOT NULL,
+  original_filename TEXT,
+  content_sha256 TEXT,  -- nullable, no uniqueness constraint
+  fields JSONB NOT NULL DEFAULT '[]'::jsonb,  -- defaults to an empty JSON array
+  is_active BOOLEAN NOT NULL DEFAULT TRUE,
+  created_by UUID REFERENCES users(id) ON DELETE SET NULL,  -- template survives deletion of its creator
+  created_at TIMESTAMPTZ NOT NULL DEFAULT now(),
+  updated_at TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+
+CREATE INDEX IF NOT EXISTS idx_document_templates_active  -- templates by active flag, newest first
+  ON document_templates (is_active, created_at DESC);
+
+COMMENT ON TABLE document_templates IS
+  'Admin-managed DOCX templates (file in MinIO initiative-templates) with extracted Jinja placeholder fields. Applicants render filled PDFs by template id.';
@@ -0,0 +1,133 @@
+-- Research-project proposals (Thuyết minh đề tài, Mẫu III.06-TM.ĐTUD) + the PI "cockpit" entities.
+-- A proposal row IS the project across its lifecycle: draft -> submitted -> approved | rejected.
+-- On approval the cockpit unlocks. Child tables (members/datasets/models/assets/milestones) hang off it.
+-- Owner+admin authz (v1): a project is owned by owner_user_id, and admins may review/approve/reject.
+-- Apply after 015_document_templates.sql:
+--   docker exec -i initiative-postgres psql -U initiative -d initiatives < be0/migrations/016_research_projects.sql
+
+CREATE TABLE IF NOT EXISTS research_projects (
+  id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  owner_user_id UUID NOT NULL REFERENCES users(id) ON DELETE CASCADE,  -- projects are removed with their owner
+  status TEXT NOT NULL DEFAULT 'draft' CHECK (status IN ('draft','submitted','approved','rejected')),
+  code TEXT,  -- nullable, no uniqueness constraint
+  title TEXT NOT NULL DEFAULT '',
+  level TEXT NOT NULL DEFAULT '',
+  pi_name TEXT NOT NULL DEFAULT '',
+  period_months INTEGER,
+  budget_total NUMERIC(14,2),
+  content JSONB NOT NULL DEFAULT '{}'::jsonb,  -- defaults to an empty JSON object
+  submitted_at TIMESTAMPTZ,
+  reviewed_by UUID REFERENCES users(id) ON DELETE SET NULL,  -- becomes NULL if the reviewer is deleted
+  reviewed_at TIMESTAMPTZ,
+  review_note TEXT,
+  created_at TIMESTAMPTZ NOT NULL DEFAULT now(),
+  updated_at TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+
+CREATE INDEX IF NOT EXISTS idx_research_projects_owner ON research_projects (owner_user_id, created_at DESC);
+CREATE INDEX IF NOT EXISTS idx_research_projects_status ON research_projects (status, created_at DESC);
+
+CREATE TABLE IF NOT EXISTS research_project_members (  -- member rows of one research project
+  id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  project_id UUID NOT NULL REFERENCES research_projects(id) ON DELETE CASCADE,  -- rows are removed with the project
+  sort_order INTEGER NOT NULL DEFAULT 0,  -- display order, not constrained to be unique
+  name TEXT NOT NULL DEFAULT '',
+  role TEXT NOT NULL DEFAULT '',
+  access TEXT NOT NULL DEFAULT '',
+  org TEXT NOT NULL DEFAULT '',
+  email TEXT NOT NULL DEFAULT '',
+  months INTEGER,
+  tasks TEXT NOT NULL DEFAULT '',
+  status TEXT NOT NULL DEFAULT '',  -- free text, no CHECK constraint
+  user_id UUID REFERENCES users(id) ON DELETE SET NULL,  -- optional link to an account, cleared if that user is deleted
+  created_at TIMESTAMPTZ NOT NULL DEFAULT now(),
+  updated_at TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+CREATE INDEX IF NOT EXISTS idx_research_project_members_project ON research_project_members (project_id, sort_order);
+
+CREATE TABLE IF NOT EXISTS research_project_datasets (  -- dataset rows of one research project
+  id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  project_id UUID NOT NULL REFERENCES research_projects(id) ON DELETE CASCADE,  -- rows are removed with the project
+  sort_order INTEGER NOT NULL DEFAULT 0,  -- display order, not constrained to be unique
+  name TEXT NOT NULL DEFAULT '',
+  type TEXT NOT NULL DEFAULT '',
+  records INTEGER,  -- nullable, no lower bound enforced
+  source TEXT NOT NULL DEFAULT '',
+  sensitivity TEXT NOT NULL DEFAULT '',  -- free text here (research_project_models.sensitivity is numeric)
+  ethics TEXT NOT NULL DEFAULT '',
+  owner TEXT NOT NULL DEFAULT '',  -- free text, not a foreign key to users
+  status TEXT NOT NULL DEFAULT '',  -- free text, no CHECK constraint
+  created_at TIMESTAMPTZ NOT NULL DEFAULT now(),
+  updated_at TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+CREATE INDEX IF NOT EXISTS idx_research_project_datasets_project ON research_project_datasets (project_id, sort_order);
+
+CREATE TABLE IF NOT EXISTS research_project_models (  -- model rows of one research project
+  id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  project_id UUID NOT NULL REFERENCES research_projects(id) ON DELETE CASCADE,  -- rows are removed with the project
+  sort_order INTEGER NOT NULL DEFAULT 0,  -- display order, not constrained to be unique
+  name TEXT NOT NULL DEFAULT '',
+  task TEXT NOT NULL DEFAULT '',
+  framework TEXT NOT NULL DEFAULT '',
+  version TEXT NOT NULL DEFAULT '',
+  dataset TEXT NOT NULL DEFAULT '',  -- free text, not a foreign key to research_project_datasets
+  auc NUMERIC(6,4),  -- the four metrics below are nullable NUMERIC(6,4) with no range CHECK
+  sensitivity NUMERIC(6,4),
+  specificity NUMERIC(6,4),
+  accuracy NUMERIC(6,4),
+  owner TEXT NOT NULL DEFAULT '',  -- free text, not a foreign key to users
+  notes TEXT NOT NULL DEFAULT '',
+  status TEXT NOT NULL DEFAULT '',  -- free text, no CHECK constraint
+  created_at TIMESTAMPTZ NOT NULL DEFAULT now(),
+  updated_at TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+CREATE INDEX IF NOT EXISTS idx_research_project_models_project ON research_project_models (project_id, sort_order);
+
+CREATE TABLE IF NOT EXISTS research_project_assets (  -- asset rows of one research project
+  id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  project_id UUID NOT NULL REFERENCES research_projects(id) ON DELETE CASCADE,  -- rows are removed with the project
+  sort_order INTEGER NOT NULL DEFAULT 0,  -- display order, not constrained to be unique
+  name TEXT NOT NULL DEFAULT '',
+  category TEXT NOT NULL DEFAULT '',
+  acquisition TEXT NOT NULL DEFAULT '',
+  value NUMERIC(14,2),  -- nullable, same precision as research_projects.budget_total
+  owner TEXT NOT NULL DEFAULT '',  -- free text, not a foreign key to users
+  notes TEXT NOT NULL DEFAULT '',
+  status TEXT NOT NULL DEFAULT '',  -- free text, no CHECK constraint
+  created_at TIMESTAMPTZ NOT NULL DEFAULT now(),
+  updated_at TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+CREATE INDEX IF NOT EXISTS idx_research_project_assets_project ON research_project_assets (project_id, sort_order);
+
+CREATE TABLE IF NOT EXISTS research_project_milestones (  -- milestone rows of one research project
+  id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  project_id UUID NOT NULL REFERENCES research_projects(id) ON DELETE CASCADE,  -- rows are removed with the project
+  sort_order INTEGER NOT NULL DEFAULT 0,  -- display order, not constrained to be unique
+  title TEXT NOT NULL DEFAULT '',
+  deliverable TEXT NOT NULL DEFAULT '',
+  start_period TEXT NOT NULL DEFAULT '',  -- stored as text, not as a date type
+  end_period TEXT NOT NULL DEFAULT '',  -- stored as text, not as a date type
+  owner TEXT NOT NULL DEFAULT '',  -- free text, not a foreign key to users
+  budget NUMERIC(14,2),
+  progress INTEGER NOT NULL DEFAULT 0,  -- NOTE(review): no range CHECK — confirm whether 0 to 100 should be enforced
+  status TEXT NOT NULL DEFAULT '',  -- free text, no CHECK constraint
+  created_at TIMESTAMPTZ NOT NULL DEFAULT now(),
+  updated_at TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+CREATE INDEX IF NOT EXISTS idx_research_project_milestones_project ON research_project_milestones (project_id, sort_order);
+
+CREATE TABLE IF NOT EXISTS research_project_audit (  -- per-project audit rows
+  id BIGSERIAL PRIMARY KEY,
+  project_id UUID NOT NULL REFERENCES research_projects(id) ON DELETE CASCADE,  -- audit rows are removed with the project
+  occurred_at TIMESTAMPTZ NOT NULL DEFAULT now(),
+  actor_user_id UUID REFERENCES users(id) ON DELETE SET NULL,  -- nulled when the user is deleted, the row stays
+  actor_name TEXT NOT NULL DEFAULT '',  -- plain text copy, not a foreign key
+  role_label TEXT NOT NULL DEFAULT '',
+  action TEXT NOT NULL,  -- free text, no enum or CHECK constraint
+  subject TEXT NOT NULL DEFAULT '',
+  detail TEXT NOT NULL DEFAULT ''
+);
+CREATE INDEX IF NOT EXISTS idx_research_project_audit_project ON research_project_audit (project_id, occurred_at DESC);
+
+COMMENT ON TABLE research_projects IS
+  'Research-project proposals (Thuyet minh de tai) that become managed projects on approval. Owner and admin authz. Content JSONB holds the full proposal form. Child research_project_* tables hold cockpit entities.';
@@ -0,0 +1,76 @@
+-- ImageHub: content-addressed imaging dataset versioning (milestone 1 walking skeleton).
+-- A dataset is owned by a user (investigator/PI). Files are stored as content-addressed,
+-- globally deduped blobs in MinIO (one imagehub_blobs row per distinct sha256). The current
+-- working file set lives in imagehub_dataset_files, and a version freezes a manifest snapshot.
+-- Admin sees all datasets (clinical data repository), owners see their own (research data).
+-- Apply after 016_research_projects.sql:
+--   docker exec -i initiative-postgres psql -U initiative -d initiatives < be0/migrations/017_imagehub_datasets.sql
+
+CREATE TABLE IF NOT EXISTS imagehub_datasets (
+  id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  owner_user_id UUID NOT NULL REFERENCES users(id) ON DELETE CASCADE,  -- datasets are removed with their owner
+  name TEXT NOT NULL DEFAULT '',
+  slug TEXT NOT NULL DEFAULT '',  -- no uniqueness constraint in this migration
+  description TEXT NOT NULL DEFAULT '',
+  visibility TEXT NOT NULL DEFAULT 'private' CHECK (visibility IN ('private','internal','public')),
+  modality_tags JSONB NOT NULL DEFAULT '[]'::jsonb,  -- defaults to an empty JSON array
+  default_branch TEXT NOT NULL DEFAULT 'main',
+  created_at TIMESTAMPTZ NOT NULL DEFAULT now(),
+  updated_at TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+CREATE INDEX IF NOT EXISTS idx_imagehub_datasets_owner ON imagehub_datasets (owner_user_id, created_at DESC);
+
+-- Globally content-addressed blob registry: identical bytes across datasets dedupe to one row.
+CREATE TABLE IF NOT EXISTS imagehub_blobs (
+  sha256 TEXT PRIMARY KEY,  -- the digest itself is the key, which is what makes duplicates collapse
+  size_bytes BIGINT NOT NULL DEFAULT 0,
+  media_type TEXT NOT NULL DEFAULT 'application/octet-stream',
+  storage_bucket TEXT NOT NULL DEFAULT '',
+  storage_key TEXT NOT NULL DEFAULT '',
+  created_at TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+
+-- Current working file set on a dataset default branch (one row per logical path).
+CREATE TABLE IF NOT EXISTS imagehub_dataset_files (
+  id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  dataset_id UUID NOT NULL REFERENCES imagehub_datasets(id) ON DELETE CASCADE,  -- file rows are removed with the dataset
+  logical_path TEXT NOT NULL DEFAULT '',
+  blob_sha256 TEXT NOT NULL REFERENCES imagehub_blobs(sha256) ON DELETE RESTRICT,  -- a blob cannot be deleted while a file row references it
+  size_bytes BIGINT NOT NULL DEFAULT 0,
+  media_type TEXT NOT NULL DEFAULT 'application/octet-stream',
+  imaging_meta JSONB NOT NULL DEFAULT '{}'::jsonb,  -- defaults to an empty JSON object
+  uploaded_by UUID REFERENCES users(id) ON DELETE SET NULL,  -- becomes NULL if the uploader is deleted
+  created_at TIMESTAMPTZ NOT NULL DEFAULT now(),
+  updated_at TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+CREATE UNIQUE INDEX IF NOT EXISTS uq_imagehub_dataset_files_path ON imagehub_dataset_files (dataset_id, logical_path);
+
+-- Frozen version snapshots (the versioning spine, DAG-ready via parent_version_id).
+CREATE TABLE IF NOT EXISTS imagehub_versions (
+  id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  dataset_id UUID NOT NULL REFERENCES imagehub_datasets(id) ON DELETE CASCADE,  -- versions are removed with the dataset
+  seq INTEGER NOT NULL DEFAULT 1,  -- unique per dataset (see the unique index below)
+  message TEXT NOT NULL DEFAULT '',
+  manifest JSONB NOT NULL DEFAULT '[]'::jsonb,  -- defaults to an empty JSON array
+  parent_version_id UUID REFERENCES imagehub_versions(id) ON DELETE SET NULL,  -- self-reference, cleared if the parent version is deleted
+  author_user_id UUID REFERENCES users(id) ON DELETE SET NULL,  -- becomes NULL if the author is deleted
+  created_at TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+CREATE UNIQUE INDEX IF NOT EXISTS uq_imagehub_versions_seq ON imagehub_versions (dataset_id, seq);
+
+-- Append-only audit trail per dataset. Append-only is a convention here, nothing in this schema blocks UPDATE or DELETE.
+CREATE TABLE IF NOT EXISTS imagehub_dataset_audit (
+  id BIGSERIAL PRIMARY KEY,
+  dataset_id UUID NOT NULL REFERENCES imagehub_datasets(id) ON DELETE CASCADE,  -- audit rows are removed with the dataset
+  occurred_at TIMESTAMPTZ NOT NULL DEFAULT now(),
+  actor_user_id UUID REFERENCES users(id) ON DELETE SET NULL,  -- nulled when the user is deleted, the row stays
+  actor_name TEXT NOT NULL DEFAULT '',  -- plain text copy, not a foreign key
+  role_label TEXT NOT NULL DEFAULT '',
+  action TEXT NOT NULL,  -- free text, no enum or CHECK constraint
+  subject TEXT NOT NULL DEFAULT '',
+  detail TEXT NOT NULL DEFAULT ''
+);
+CREATE INDEX IF NOT EXISTS idx_imagehub_dataset_audit_dataset ON imagehub_dataset_audit (dataset_id, occurred_at DESC);
+
+COMMENT ON TABLE imagehub_datasets IS
+  'ImageHub content-addressed imaging datasets. Owner and admin authz. Files dedupe into imagehub_blobs by sha256 — imagehub_versions freezes a manifest snapshot.';
@@ -0,0 +1,21 @@
+-- ImageHub: link organ-segmentation masks to their parent image file (Phase D).
+-- A mask file (file_kind='segmentation') points at the image it segments via a
+-- self-referential parent_file_id (e.g. an organ mask of ct.nii.gz). The organ_label column
+-- names the organ. Regular files stay file_kind='image'. Idempotent (ADD COLUMN IF
+-- NOT EXISTS) so the startup runner can apply it to volumes that predate it.
+-- Apply after 017_imagehub_datasets.sql (no semicolons inside comments — the runner
+-- splitter is naive):
+--   docker exec -i initiative-postgres psql -U initiative -d initiatives < be0/migrations/018_imagehub_segmentation_links.sql
+
+ALTER TABLE imagehub_dataset_files
+  ADD COLUMN IF NOT EXISTS file_kind TEXT NOT NULL DEFAULT 'image' CHECK (file_kind IN ('image','segmentation'));
+-- Deleting an image row also deletes the mask rows that point at it (ON DELETE CASCADE).
+ALTER TABLE imagehub_dataset_files
+  ADD COLUMN IF NOT EXISTS parent_file_id UUID REFERENCES imagehub_dataset_files(id) ON DELETE CASCADE;
+-- organ_label defaults to an empty string, so existing rows need no backfill.
+ALTER TABLE imagehub_dataset_files
+  ADD COLUMN IF NOT EXISTS organ_label TEXT NOT NULL DEFAULT '';
+
+-- List all masks of an image efficiently.
+CREATE INDEX IF NOT EXISTS idx_imagehub_dataset_files_parent
+  ON imagehub_dataset_files (parent_file_id);
@@ -0,0 +1,53 @@
+-- ImageHub: Cloud Import — storage methods + external (referenced, not copied) dataset files.
+-- A storage method holds verified credentials (config_encrypted, never returned to the client)
+-- for an external bucket (S3/GCS/Azure). A dataset file is then EITHER a local content-addressed
+-- blob (blob_sha256 set) OR an external reference (storage_method_id + external_path set) that
+-- streams from the bucket and is never copied to our servers (privacy rule C4). Idempotent
+-- (CREATE/ADD ... IF NOT EXISTS) so the startup runner can apply it to volumes that predate it.
+-- Apply after 018 (no semicolons inside comments or string literals — the runner splitter is naive):
+--   docker exec -i initiative-postgres psql -U initiative -d initiatives < be0/migrations/019_imagehub_cloud_import.sql
+
+CREATE TABLE IF NOT EXISTS imagehub_storage_methods (
+  id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  owner_id UUID NOT NULL REFERENCES users(id) ON DELETE CASCADE,  -- storage methods are removed with their owner
+  name TEXT NOT NULL,
+  provider TEXT NOT NULL CHECK (provider IN ('s3','gcs','azure')),
+  access_mode TEXT NOT NULL DEFAULT 'read' CHECK (access_mode IN ('read','readwrite')),
+  bucket TEXT NOT NULL,
+  region TEXT,  -- nullable
+  config_encrypted TEXT NOT NULL,  -- encryption happens outside the database, this column only stores the text
+  verification_status TEXT NOT NULL DEFAULT 'pending' CHECK (verification_status IN ('pending','verified','failed')),
+  verification_reason TEXT,
+  verification_checked_at TIMESTAMPTZ,
+  created_by UUID REFERENCES users(id) ON DELETE SET NULL,  -- becomes NULL if the creating user is deleted
+  created_at TIMESTAMPTZ NOT NULL DEFAULT now(),
+  updated_at TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+
+CREATE INDEX IF NOT EXISTS idx_imagehub_storage_methods_owner
+  ON imagehub_storage_methods (owner_id);
+
+-- Allow a dataset file to be an external reference instead of a local blob. Existing rows keep
+-- blob_sha256 set and the new columns NULL, so they satisfy the local-blob branch of the CHECK.
+ALTER TABLE imagehub_dataset_files
+  ALTER COLUMN blob_sha256 DROP NOT NULL;
+-- ON DELETE RESTRICT: a storage method cannot be deleted while dataset files still reference it.
+ALTER TABLE imagehub_dataset_files
+  ADD COLUMN IF NOT EXISTS storage_method_id UUID REFERENCES imagehub_storage_methods(id) ON DELETE RESTRICT;
+
+ALTER TABLE imagehub_dataset_files
+  ADD COLUMN IF NOT EXISTS external_path TEXT;
+
+-- A file is EITHER a local content-addressed blob OR an external reference, never both or neither.
+ALTER TABLE imagehub_dataset_files
+  DROP CONSTRAINT IF EXISTS ck_imagehub_file_storage_mode;
+-- ADD CONSTRAINT has no IF NOT EXISTS form, hence the drop-then-add pair to stay re-runnable.
+ALTER TABLE imagehub_dataset_files
+  ADD CONSTRAINT ck_imagehub_file_storage_mode CHECK (
+    (blob_sha256 IS NOT NULL AND storage_method_id IS NULL AND external_path IS NULL)
+    OR
+    (blob_sha256 IS NULL AND storage_method_id IS NOT NULL AND external_path IS NOT NULL)
+  );
+
+CREATE INDEX IF NOT EXISTS idx_imagehub_dataset_files_storage_method
+  ON imagehub_dataset_files (storage_method_id);
@@ -0,0 +1,26 @@
+-- ImageHub: labeling-pipeline stages on a dataset (Label -> Review_1 -> Review_2 ...). Each stage
+-- has a kind (label/review), an order (seq), an optional review_percent (review stages only), and
+-- an auto_assign flag (the "Automatic Task Assignment" toggle). Idempotent (CREATE ... IF NOT
+-- EXISTS) so the startup runner can apply it to volumes that predate it. Apply after 019 (no
+-- semicolons inside comments or string literals — the runner splitter is naive):
+--   docker exec -i initiative-postgres psql -U initiative -d initiatives < be0/migrations/020_imagehub_dataset_stages.sql
+
+CREATE TABLE IF NOT EXISTS imagehub_dataset_stages (
+  id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  dataset_id UUID NOT NULL REFERENCES imagehub_datasets(id) ON DELETE CASCADE,  -- stages are removed with the dataset
+  name TEXT NOT NULL,
+  kind TEXT NOT NULL DEFAULT 'label' CHECK (kind IN ('label','review')),
+  seq INTEGER NOT NULL DEFAULT 0,  -- pipeline order, not constrained to be unique per dataset
+  review_percent INTEGER CHECK (review_percent IS NULL OR (review_percent >= 0 AND review_percent <= 100)),  -- the schema does not tie this to kind
+  auto_assign BOOLEAN NOT NULL DEFAULT TRUE,
+  created_at TIMESTAMPTZ NOT NULL DEFAULT now(),
+  updated_at TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+
+-- Stages of a dataset, in pipeline order.
+CREATE INDEX IF NOT EXISTS idx_imagehub_dataset_stages_dataset
+  ON imagehub_dataset_stages (dataset_id, seq);
+
+-- A stage name is unique within its dataset.
+CREATE UNIQUE INDEX IF NOT EXISTS uq_imagehub_dataset_stages_name
+  ON imagehub_dataset_stages (dataset_id, name);
@@ -0,0 +1,37 @@
+-- ImageHub: per-file work TASKS that flow through a dataset's pipeline stages (single-user MVP).
+-- A task is a NEW join row (one per dataset file) carrying its pipeline position (current_stage_id
+-- + pipeline_state), per-user queue status, assignee, priority, and the Ground-Truth reference flag.
+-- The file row itself (imagehub_dataset_files) stays a pure storage record. Membership / multi-labeler
+-- assignment is a later phase, so for now task access reuses the dataset owner-or-admin gate.
+-- Idempotent (CREATE ... IF NOT EXISTS) so the startup runner can apply it to volumes that predate it.
+-- Apply after 020 (no semicolons inside comments or string literals — the runner splitter is naive):
+--   docker exec -i initiative-postgres psql -U initiative -d initiatives < be0/migrations/021_imagehub_task_pipeline.sql
+
+-- One work task per dataset file. Rows go away with their dataset or their file (ON DELETE CASCADE).
+CREATE TABLE IF NOT EXISTS imagehub_tasks (
+  id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  dataset_id UUID NOT NULL REFERENCES imagehub_datasets(id) ON DELETE CASCADE,
+  dataset_file_id UUID NOT NULL REFERENCES imagehub_dataset_files(id) ON DELETE CASCADE,
+  name TEXT NOT NULL DEFAULT '',
+  -- Deleting a stage keeps the task and clears its stage pointer (ON DELETE SET NULL).
+  current_stage_id UUID REFERENCES imagehub_dataset_stages(id) ON DELETE SET NULL,
+  -- Pipeline position, one of inLabel / inReview / groundTruth / issue.
+  pipeline_state TEXT NOT NULL DEFAULT 'inLabel' CHECK (pipeline_state IN ('inLabel','inReview','groundTruth','issue')),
+  -- Queue status, one of assigned / saved / pendingFinalization / skipped.
+  queue_status TEXT NOT NULL DEFAULT 'assigned' CHECK (queue_status IN ('assigned','saved','pendingFinalization','skipped')),
+  -- Deleting the assigned user keeps the task and leaves it unassigned (ON DELETE SET NULL).
+  assignee_user_id UUID REFERENCES users(id) ON DELETE SET NULL,
+  assignment_mode TEXT NOT NULL DEFAULT 'auto' CHECK (assignment_mode IN ('auto','manual')),
+  -- Bounded to the closed range 0..1.
+  priority DOUBLE PRECISION NOT NULL DEFAULT 0 CHECK (priority >= 0 AND priority <= 1),
+  is_reference_standard BOOLEAN NOT NULL DEFAULT FALSE,
+  -- NOTE(review): purpose is not stated in this file, presumably an ordering key for skipped tasks. Confirm.
+  skipped_seq BIGINT,
+  created_at TIMESTAMPTZ NOT NULL DEFAULT now(),
+  updated_at TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+
+-- One task per file (MVP simplification — droppable later for multi-task-per-file).
+CREATE UNIQUE INDEX IF NOT EXISTS uq_imagehub_tasks_file
+  ON imagehub_tasks (dataset_file_id);
+
+-- Queue scan: a dataset's tasks at a given stage and status, highest priority first.
+CREATE INDEX IF NOT EXISTS idx_imagehub_tasks_queue
+  ON imagehub_tasks (dataset_id, current_stage_id, queue_status, priority DESC);
+
+-- A user's personal labeling queue across datasets.
+CREATE INDEX IF NOT EXISTS idx_imagehub_tasks_assignee
+  ON imagehub_tasks (assignee_user_id, queue_status);
@@ -0,0 +1,8 @@
+-- ImageHub: a task's labeler annotations (bbox / points / pen / brush / polygon) stored as JSON.
+-- The shared viewer's annotation overlay emits normalized [0..1] vector geometry per slice — small
+-- JSON, persisted on the task so the AnnotationTool can load + save a labeler's work. Idempotent
+-- (ADD COLUMN IF NOT EXISTS) so the startup runner can apply it to volumes that predate it. Apply
+-- after 021 (no semicolons inside comments or string literals — the runner splitter is naive):
+--   docker exec -i initiative-postgres psql -U initiative -d initiatives < be0/migrations/022_imagehub_task_annotations.sql
+
+-- NOT NULL with a constant default, so existing task rows read back an empty JSON array.
+ALTER TABLE imagehub_tasks ADD COLUMN IF NOT EXISTS annotations JSONB NOT NULL DEFAULT '[]'::jsonb;
@@ -0,0 +1,23 @@
+-- ImageHub: dataset membership — lets users other than the owner work a dataset's tasks
+-- (multi-labeler). MVP treats all members as labelers: they view the dataset and work tasks
+-- assigned to them, while dataset / stage / settings management stays with the owner + platform
+-- admins. The role column is reserved for a future project-admin tier. Idempotent. Apply after 022
+-- (no semicolons inside comments or string literals — the runner splitter is naive):
+--   docker exec -i initiative-postgres psql -U initiative -d initiatives < be0/migrations/023_imagehub_dataset_members.sql
+
+-- One row per (dataset, user) membership. Rows go away with either the dataset or the user.
+CREATE TABLE IF NOT EXISTS imagehub_dataset_members (
+  id UUID PRIMARY KEY DEFAULT gen_random_uuid(),
+  dataset_id UUID NOT NULL REFERENCES imagehub_datasets(id) ON DELETE CASCADE,
+  user_id UUID NOT NULL REFERENCES users(id) ON DELETE CASCADE,
+  -- Restricted to 'project_admin' or 'member', defaulting to 'member'.
+  role TEXT NOT NULL DEFAULT 'member' CHECK (role IN ('project_admin','member')),
+  -- Deleting the adding user keeps the membership and clears this pointer (ON DELETE SET NULL).
+  added_by UUID REFERENCES users(id) ON DELETE SET NULL,
+  created_at TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+
+-- One membership per user per dataset.
+CREATE UNIQUE INDEX IF NOT EXISTS uq_imagehub_dataset_members_user
+  ON imagehub_dataset_members (dataset_id, user_id);
+
+-- "Datasets I am a member of" lookup (the member's dataset list).
+CREATE INDEX IF NOT EXISTS idx_imagehub_dataset_members_user
+  ON imagehub_dataset_members (user_id);
@@ -0,0 +1,13 @@
+-- ImageHub: link a dataset to a research project (the "workspace" superstructure). Nullable,
+-- so existing datasets stay unlinked and a dataset can still exist standalone. A dataset created
+-- from a project cockpit attaches to that project. ON DELETE SET NULL so deleting a project
+-- orphans its datasets rather than dropping the imaging data. Idempotent. Apply after 023
+-- (no semicolons inside comments or string literals — the runner splitter is naive):
+--   docker exec -i initiative-postgres psql -U initiative -d initiatives < be0/migrations/024_imagehub_dataset_project_link.sql
+
+-- Nullable foreign key with no default, so existing dataset rows get NULL (unlinked).
+ALTER TABLE imagehub_datasets
+  ADD COLUMN IF NOT EXISTS research_project_id UUID REFERENCES research_projects(id) ON DELETE SET NULL;
+
+-- "Datasets in this project" lookup (the project-scoped dataset list).
+CREATE INDEX IF NOT EXISTS idx_imagehub_datasets_research_project
+  ON imagehub_datasets (research_project_id);
@@ -0,0 +1,25 @@
+-- ImageHub: structured review decisions. The task pipeline applies accept/acceptWithCorrections/
+-- reject moves, but until now the verdict survived only as a free-text Vietnamese audit string —
+-- not queryable, no reviewer/stage FK, no reject reason. This append-only table records every
+-- review decision so review history + per-reviewer accept/reject counters become real. Idempotent.
+-- Apply after 024 (no semicolons inside comments or string literals — the runner splitter is naive):
+--   docker exec -i initiative-postgres psql -U initiative -d initiatives < be0/migrations/025_imagehub_task_review_events.sql
+
+-- One row per review decision. Rows go away with their dataset or their task (ON DELETE CASCADE).
+CREATE TABLE IF NOT EXISTS imagehub_task_review_events (
+  -- Sequential BIGSERIAL key, unlike the UUID keys of the other ImageHub tables.
+  id BIGSERIAL PRIMARY KEY,
+  dataset_id UUID NOT NULL REFERENCES imagehub_datasets(id) ON DELETE CASCADE,
+  task_id UUID NOT NULL REFERENCES imagehub_tasks(id) ON DELETE CASCADE,
+  -- Deleting the stage or the reviewer keeps the event and clears the pointer (ON DELETE SET NULL).
+  stage_id UUID REFERENCES imagehub_dataset_stages(id) ON DELETE SET NULL,
+  reviewer_user_id UUID REFERENCES users(id) ON DELETE SET NULL,
+  -- One of accept / acceptWithCorrections / reject.
+  decision TEXT NOT NULL CHECK (decision IN ('accept','acceptWithCorrections','reject')),
+  note TEXT NOT NULL DEFAULT '',
+  created_at TIMESTAMPTZ NOT NULL DEFAULT now()
+);
+
+-- Per-reviewer counters over a date window (the productivity panel query).
+CREATE INDEX IF NOT EXISTS idx_imagehub_review_events_reviewer
+  ON imagehub_task_review_events (dataset_id, reviewer_user_id, created_at);
+
+-- A task's review history (chronological).
+CREATE INDEX IF NOT EXISTS idx_imagehub_review_events_task
+  ON imagehub_task_review_events (task_id, created_at);
@@ -0,0 +1,21 @@
+-- ImageHub: persist the relative folder path of each uploaded file (Option B — real folders inside
+-- a dataset). Until now logical_path was basename-flattened, so an uploaded directory structure
+-- (e.g. the nnU-Net imagesTr/labelsTr layout) was lost once files reached MinIO. folder_path keeps
+-- the relative directory so the dataset browser can render a real folder tree and the structure
+-- round-trips. The working-file natural key moves from (dataset_id, logical_path) to
+-- (dataset_id, folder_path, logical_path) so two files sharing a basename in different folders no
+-- longer collide and silently merge. Existing rows default folder_path to the empty string, so the
+-- new key stays unique wherever the old one was. Idempotent.
+-- Apply after 025 (no semicolons inside comments or string literals — the runner splitter is naive):
+--   docker exec -i initiative-postgres psql -U initiative -d initiatives < be0/migrations/026_imagehub_file_folder_path.sql
+
+-- NOT NULL with a constant default, so every existing row gets the empty folder path.
+ALTER TABLE imagehub_dataset_files
+  ADD COLUMN IF NOT EXISTS folder_path TEXT NOT NULL DEFAULT '';
+
+-- Build the new, wider natural key BEFORE dropping the old one. The statements of this file
+-- are not guaranteed to run atomically, so with this order a failure while building the new
+-- index still leaves the old unique key enforcing (dataset_id, logical_path).
+CREATE UNIQUE INDEX IF NOT EXISTS uq_imagehub_dataset_files_folder_path
+  ON imagehub_dataset_files (dataset_id, folder_path, logical_path);
+
+-- Only now retire the old basename-only key.
+DROP INDEX IF EXISTS uq_imagehub_dataset_files_path;
+
+-- Listing the files of one folder of a dataset.
+CREATE INDEX IF NOT EXISTS idx_imagehub_dataset_files_folder
+  ON imagehub_dataset_files (dataset_id, folder_path);
@@ -0,0 +1,12 @@
+-- ImageHub: per-dataset value to name label map for multi-label segmentation masks. A multi-label
+-- labelsTr/<case>.nii.gz encodes each organ or structure as an integer voxel value (1, 2, 3 …). Until
+-- now the viewer named those values from a fixed TotalSegmentator-v2 117-class map, so a non
+-- TotalSegmentator dataset (KiTS = 1 kidney / 2 tumor / 3 cyst, or any custom nnU-Net labels) showed
+-- confidently-wrong organ names. label_map stores the dataset-specific value-to-name mapping (a JSON object
+-- with string keys), so the organ panel labels each overlay correctly and a user can edit them. The
+-- empty default keeps the TotalSegmentator fallback for datasets without a map. Idempotent.
+-- Apply after 026 (no semicolons inside comments or string literals — the runner splitter is naive):
+--   docker exec -i initiative-postgres psql -U initiative -d initiatives < be0/migrations/027_imagehub_dataset_label_map.sql
+
+-- NOT NULL with a constant default, so existing dataset rows read back an empty JSON object.
+ALTER TABLE imagehub_datasets
+  ADD COLUMN IF NOT EXISTS label_map JSONB NOT NULL DEFAULT '{}'::jsonb;
@@ -0,0 +1,6 @@
+# Test-only dependencies for CI (not installed in the runtime image).
+# be0 tests are a mix of unittest.TestCase (incl. IsolatedAsyncioTestCase) and
+# pytest-style; pytest runs both. pytest-asyncio covers the pytest async tests.
+-r requirements.txt
+pytest>=8,<9
+pytest-asyncio>=0.23,<0.24
@@ -0,0 +1,43 @@
+uvicorn[standard]
+httpx
+sqlalchemy[asyncio]>=2.0
+asyncpg>=0.29
+greenlet>=3.0
+argon2-cffi>=23.1.0
+PyJWT>=2.8.0
+ollama
+fastapi
+# asyncio is part of the Python standard library and must not be installed from PyPI
+# (the PyPI project of that name is an obsolete backport), so it is not listed here.
+python-multipart
+
+langchain
+langchain-core
+langgraph
+
+langchain-community
+sentence-transformers
+# NOTE(review): the official Hugging Face client is published as huggingface-hub;
+# confirm that the plain "huggingface" distribution below is really intended.
+huggingface
+scikit-learn
+
+neo4j
+
+nltk
+rake-nltk
+pypdf
+pydantic
+pydantic-settings
+aioboto3
+zipstream-ng
+boto3
+numpy
+pandas
+
+pyvi
+docling
+pymupdf
+docxtpl>=0.16
+openpyxl>=3.1.0
+
+# ImageHub: best-effort imaging metadata sniff (DICOM / NIfTI). See src/imagehub_routes.py.
+pydicom
+nibabel
@@ -0,0 +1,93 @@
+"""
+Script to add the 10 UMP innovation ideas to the vector database
+"""
+import asyncio
+import sys
+from pathlib import Path
+
+# Add parent directory to path
+sys.path.insert(0, str(Path(__file__).parent.parent))
+
+from src.infrastructure.vector_db.qdrant_service import get_qdrant_service
+
+UMP_IDEAS = [
+    {
+        "title": "Nền tảng Trợ lý AI học tập lâm sàng (Clinical AI Tutor)",
+        "description": "Ứng dụng AI đóng vai trò trợ giảng cho sinh viên y, hỗ trợ phân tích ca bệnh giả lập, giải thích cận lâm sàng, và gợi ý chẩn đoán theo phác đồ Việt Nam.",
+        "category": "Giáo dục - AI"
+    },
+    {
+        "title": "Hệ thống bệnh án điện tử học thuật (Academic EMR Sandbox)",
+        "description": "Môi trường EMR mô phỏng cho đào tạo và nghiên cứu, cho phép sinh viên và giảng viên thực hành nhập – phân tích – khai thác dữ liệu y khoa mà không ảnh hưởng dữ liệu bệnh nhân thật.",
+        "category": "Giáo dục - Chuyển đổi số"
+    },
+    {
+        "title": "Trung tâm mô phỏng y khoa bằng AR/VR & Digital Twin",
+        "description": "Xây dựng phòng lab mô phỏng phẫu thuật, cấp cứu, và quy trình điều trị bằng AR/VR, kết hợp mô hình \"digital twin\" của cơ thể người phục vụ đào tạo nâng cao.",
+        "category": "Giáo dục - AR/VR"
+    },
+    {
+        "title": "Chương trình Y tế cộng đồng số cho vùng sâu vùng xa",
+        "description": "Kết hợp telehealth, trợ lý ảo y tế (agentic care) và AI sàng lọc sớm bệnh không lây (NCD) cho người dân vùng nông thôn, miền núi và hải đảo.",
+        "category": "Tác động xã hội - Telehealth"
+    },
+    {
+        "title": "Nền tảng nghiên cứu AI y sinh dùng chung (UMP AI Research Hub)",
+        "description": "Cung cấp hạ tầng GPU, kho dữ liệu y khoa ẩn danh, và công cụ phân tích AI cho giảng viên – nghiên cứu sinh – startup hợp tác nghiên cứu.",
+        "category": "Nghiên cứu - AI"
+    },
+    {
+        "title": "Hệ thống theo dõi và dự báo sức khỏe sinh viên & nhân viên y tế",
+        "description": "Ứng dụng phân tích dữ liệu và AI để phát hiện sớm stress, burnout, và vấn đề sức khỏe tâm thần trong cộng đồng sinh viên và nhân viên y tế.",
+        "category": "Tác động xã hội - Sức khỏe"
+    },
+    {
+        "title": "Vườn ươm khởi nghiệp công nghệ y sinh (MedTech Incubator)",
+        "description": "Hỗ trợ sinh viên, bác sĩ và giảng viên phát triển startup MedTech, HealthTech, AI y tế thông qua mentoring, quỹ seed và kết nối bệnh viện – doanh nghiệp.",
+        "category": "Khởi nghiệp - MedTech"
+    },
+    {
+        "title": "Hệ thống quản lý chất lượng đào tạo và kiểm định số",
+        "description": "Số hóa toàn bộ quy trình đảm bảo chất lượng nội bộ (IQA), đánh giá chương trình đào tạo, và chuẩn hóa theo tiêu chuẩn quốc tế (WFME, AUN-QA).",
+        "category": "Giáo dục - Quản lý chất lượng"
+    },
+    {
+        "title": "Nền tảng dữ liệu lớn phòng chống dịch và bệnh không lây",
+        "description": "Phân tích dữ liệu dịch tễ, môi trường, và hành vi để dự báo dịch bệnh, hỗ trợ Sở Y tế và Bộ Y tế trong ra quyết định chính sách.",
+        "category": "Nghiên cứu - Dịch tễ học"
+    },
+    {
+        "title": "Học viện Y học chính xác & Y học cá thể hóa",
+        "description": "Kết hợp dữ liệu gen, hình ảnh y khoa, lối sống và AI để nghiên cứu và ứng dụng điều trị cá thể hóa cho bệnh ung thư, tim mạch và bệnh mạn tính.",
+        "category": "Nghiên cứu - Y học chính xác"
+    }
+]
+
+async def main():
+    """Insert every entry of ``UMP_IDEAS`` into the vector store.
+
+    The collection is initialised first. Ideas are then added one at a time,
+    and a failure on one idea is reported and does not stop the remaining ones.
+
+    Returns:
+        The list of results returned by ``add_idea`` for the ideas that were added.
+    """
+    print("Initializing Qdrant service...")
+    service = get_qdrant_service()
+
+    print("Initializing collection...")
+    await service.initialize_collection()
+
+    print(f"Adding {len(UMP_IDEAS)} ideas to the database...")
+    results = []
+    i = 0
+    for idea in UMP_IDEAS:
+        i += 1
+        # Script-level boundary: report any failure for this idea and carry on.
+        try:
+            print(f"Adding idea {i}/{len(UMP_IDEAS)}: {idea['title']}")
+            fields = {
+                "title": idea['title'],
+                "description": idea['description'],
+                "category": idea['category'],
+            }
+            result = await service.add_idea(**fields)
+            results.append(result)
+            print(f"✓ Added: {result['id']}")
+        except Exception as e:
+            print(f"✗ Error adding idea {i}: {e}")
+
+    print(f"\n✓ Successfully added {len(results)}/{len(UMP_IDEAS)} ideas")
+    return results
+
+if __name__ == "__main__":
+    asyncio.run(main())
@@ -0,0 +1,86 @@
+#!/usr/bin/env bash
+# Apply migration 007 (user_roles.admin_from_email_policy) to an EXISTING Postgres.
+# initdb scripts in docker-entrypoint-initdb.d run only on first volume creation.
+#
+# Default (full SQL file): adds column, runs one-time policy DELETE/UPDATE (see
+# be0/migrations/007_user_roles_email_policy_admin.sql before running on prod).
+#
+# Usage (from anywhere):
+#   ./be0/scripts/apply-migration-007.sh
+#   ./be0/scripts/apply-migration-007.sh --schema-only   # only ADD COLUMN (safest repeat)
+#
+# On a remote host (SSH to be0/docker host, repo or copy of migrations present):
+#   export POSTGRES_CONTAINER=initiative-postgres POSTGRES_USER=initiative POSTGRES_DB=initiatives
+#   ./be0/scripts/apply-migration-007.sh
+#
+# From repo root (wrapper):
+#   ./scripts/apply-migration-007-postgres.sh
+set -euo pipefail
+
+# Parse command-line flags. SCHEMA_ONLY=1 selects the ADD COLUMN-only path.
+SCHEMA_ONLY=0
+for arg in "$@"; do
+  case "$arg" in
+    --schema-only) SCHEMA_ONLY=1 ;;
+    -h|--help)
+      # The usage header is file lines 2-17. Stop there so no code is printed.
+      sed -n '2,17p' "$0"
+      exit 0
+      ;;
+    *)
+      # Refuse unknown flags: a mistyped --schema-only must never fall through
+      # to the full migration, which also modifies data.
+      echo "error: unknown argument: $arg (try --help)" >&2
+      exit 2
+      ;;
+  esac
+done
+
+# Resolve the be0 directory from this script's own location, so the script works from any cwd.
+BE0_ROOT="$(cd "$(dirname "$0")/.." && pwd)"
+SQL_FULL="$BE0_ROOT/migrations/007_user_roles_email_policy_admin.sql"
+# Target container and credentials, overridable through the environment.
+CONTAINER="${POSTGRES_CONTAINER:-initiative-postgres}"
+PGUSER="${POSTGRES_USER:-initiative}"
+PGDATABASE="${POSTGRES_DB:-initiatives}"
+
+# Preflight, from the most general failure to the most specific:
+# is the Docker daemon reachable, does the container exist, is it running.
+if ! docker info >/dev/null 2>&1; then
+  echo "error: Docker is not reachable (is the daemon running?)" >&2
+  exit 1
+fi
+if ! docker inspect "$CONTAINER" >/dev/null 2>&1; then
+  echo "error: container not found: $CONTAINER (set POSTGRES_CONTAINER)" >&2
+  exit 1
+fi
+# "|| echo false" keeps a failing inspect from aborting the script under set -e.
+if [[ "$(docker inspect -f '{{.State.Running}}' "$CONTAINER" 2>/dev/null || echo false)" != "true" ]]; then
+  echo "error: container is not running: $CONTAINER" >&2
+  exit 1
+fi
+
+# Apply only the ADD COLUMN and its COMMENT by piping the inline SQL below into psql
+# inside the container. ON_ERROR_STOP=1 makes psql stop at the first failing statement.
+# The heredoc delimiter is quoted, so the shell passes the SQL through without expansion.
+apply_schema_only() {
+  docker exec -i "$CONTAINER" psql -U "$PGUSER" -d "$PGDATABASE" -v ON_ERROR_STOP=1 <<'SQL'
+ALTER TABLE user_roles ADD COLUMN IF NOT EXISTS admin_from_email_policy BOOLEAN NOT NULL DEFAULT FALSE;
+
+COMMENT ON COLUMN user_roles.admin_from_email_policy IS
+  'TRUE when admin was granted by email allow-list (AUTH_ADMIN_EMAILS). Reconciliation may DELETE this row if the user email is no longer in the list. FALSE preserves manually granted admin (future / exceptional).';
+SQL
+}
+
+# Pipe the complete 007 migration file into psql inside the container.
+# Exits with status 1 when the migration file is not present on the host.
+apply_full() {
+  [[ -f "$SQL_FULL" ]] || {
+    echo "error: missing migration file: $SQL_FULL" >&2
+    exit 1
+  }
+  docker exec -i "$CONTAINER" psql -U "$PGUSER" -d "$PGDATABASE" -v ON_ERROR_STOP=1 <"$SQL_FULL"
+}
+
+# Confirm that public.user_roles.admin_from_email_policy now exists.
+# Exits with status 1 when the probe does not return exactly "1".
+verify_column() {
+  local probe="SELECT 1 FROM information_schema.columns WHERE table_schema = 'public' AND table_name = 'user_roles' AND column_name = 'admin_from_email_policy'"
+  local found
+  found="$(docker exec "$CONTAINER" psql -U "$PGUSER" -d "$PGDATABASE" -tAc "$probe")"
+  # Drop carriage returns before comparing.
+  found="${found//$'\r'/}"
+  [[ "$found" == "1" ]] && return 0
+  echo "error: verification failed: column admin_from_email_policy missing on public.user_roles" >&2
+  exit 1
+}
+
+# Run the selected variant, then verify that the column is really there.
+if [[ "$SCHEMA_ONLY" -eq 0 ]]; then
+  echo "Applying full 007_user_roles_email_policy_admin.sql → $CONTAINER / $PGDATABASE"
+  apply_full
+else
+  echo "Applying schema only (ADD COLUMN + COMMENT) → $CONTAINER / $PGDATABASE"
+  apply_schema_only
+fi
+
+verify_column
+echo "ok: user_roles.admin_from_email_policy is present; admin register/login should work with current be0."
@@ -0,0 +1,533 @@
+"""
+Apply idempotent SQL fixes when the DB volume predates newer migrations.
+
+- ``008_audit_events.sql`` when ``audit_events`` is missing (older volumes never
+  ran ``docker-entrypoint-initdb.d`` for new files).
+- ``009_backup_artifact_roles_storage_kind.sql`` when ``storage_kind`` is missing.
+- ``010_user_staff_profiles.sql`` + ``011_academic_titles_vn.sql`` when
+  ``academic_titles`` is missing (staff profile / register flow).
+- ``013_email_verification.sql`` when ``email_verification_tokens`` is missing.
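+- ``014_registration_otp.sql`` when ``registration_otp_codes`` is missing.
+- Later migrations (``015`` … ``027``: document templates, research projects, ImageHub)
+  follow the same pattern, each keyed on the table or column probed by its ``_needs_*``
+  check below.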
+
+Run automatically from entrypoint when ``INITIATIVE_DATABASE_URL`` is set.
+Standalone:
+
+  INITIATIVE_DATABASE_URL=postgresql+asyncpg://user:pass@host:5432/dbname \\
+    python scripts/apply_initiative_migrations.py
+"""
+
+from __future__ import annotations
+
+import asyncio
+import os
+import sys
+from pathlib import Path
+
+
+def _async_url_to_asyncpg_dsn(url: str) -> str:
+    """Turn a SQLAlchemy-style async URL into a plain DSN for ``asyncpg``.
+
+    Surrounding whitespace is removed. When the URL mentions ``+asyncpg``, the
+    first ``postgresql+asyncpg://`` is rewritten to ``postgresql://``. Any
+    other URL is returned stripped but otherwise unchanged.
+    """
+    dsn = url.strip()
+    if "+asyncpg" not in dsn:
+        return dsn
+    return dsn.replace("postgresql+asyncpg://", "postgresql://", 1)
+
+
+def _strip_sql_comments(text: str) -> str:
+    """Remove whole-line ``--`` comments from *text*.
+
+    A line is dropped when its first non-blank characters are ``--``. Trailing
+    comments that follow code on the same line are kept. The surviving lines
+    are joined with ``\\n``.
+    """
+    kept = [
+        raw
+        for raw in text.splitlines()
+        if not raw.strip().startswith("--")
+    ]
+    return "\n".join(kept)
+
+
+def _split_sql_statements(text: str) -> list[str]:
+    """Split a SQL script into its individual statements.
+
+    A semicolon ends a statement only when it is real SQL punctuation.
+    Semicolons inside any of the following are kept as part of the statement:
+
+    - ``$$ ... $$`` dollar-quoted blocks (008 uses ``DO $$``),
+    - single-quoted string literals (a doubled ``''`` stays inside the literal),
+    - double-quoted identifiers,
+    - ``--`` comments up to the end of the line,
+    - ``/* ... */`` block comments.
+
+    Tagged dollar quotes (``$tag$``) and nested block comments are not
+    recognised. An unterminated quote or comment runs to the end of the input.
+
+    Args:
+        text: The SQL script.
+
+    Returns:
+        The statements in order, stripped of surrounding whitespace, without
+        their terminating semicolon and without empty statements.
+    """
+    statements: list[str] = []
+    buf: list[str] = []
+
+    def _flush() -> None:
+        stmt = "".join(buf).strip()
+        if stmt:
+            statements.append(stmt)
+        buf.clear()
+
+    i = 0
+    n = len(text)
+    while i < n:
+        ch = text[i]
+        if text.startswith("$$", i):
+            # Dollar-quoted body: copy through to the closing ``$$``.
+            end = text.find("$$", i + 2)
+            stop = n if end == -1 else end + 2
+        elif ch in "'\"":
+            # Quoted literal or identifier. A doubled quote simply starts the
+            # next quoted run, so it never leaves the literal for long enough
+            # to expose a semicolon.
+            end = text.find(ch, i + 1)
+            stop = n if end == -1 else end + 1
+        elif text.startswith("--", i):
+            # Line comment: copy up to (not including) the newline.
+            end = text.find("\n", i)
+            stop = n if end == -1 else end
+        elif text.startswith("/*", i):
+            end = text.find("*/", i + 2)
+            stop = n if end == -1 else end + 2
+        elif ch == ";":
+            _flush()
+            i += 1
+            continue
+        else:
+            stop = i + 1
+        buf.append(text[i:stop])
+        i = stop
+    _flush()
+    return statements
+
+
+async def _needs_audit_events_migration(conn) -> bool:
+    """Return True when the ``public.audit_events`` table is missing (008 pending)."""
+    probe = """
+        SELECT 1
+        FROM information_schema.tables
+        WHERE table_schema = 'public'
+          AND table_name = 'audit_events'
+        LIMIT 1
+        """
+    return (await conn.fetchrow(probe)) is None
+
+
+async def _needs_backup_migration(conn) -> bool:
+    """Return True when ``application_artifacts.storage_kind`` is missing (009 pending)."""
+    probe = """
+        SELECT 1
+        FROM information_schema.columns
+        WHERE table_schema = 'public'
+          AND table_name = 'application_artifacts'
+          AND column_name = 'storage_kind'
+        LIMIT 1
+        """
+    return (await conn.fetchrow(probe)) is None
+
+
+async def _needs_staff_profiles_migration(conn) -> bool:
+    """Return True when the ``public.academic_titles`` table is missing (010 + 011 pending)."""
+    probe = """
+        SELECT 1
+        FROM information_schema.tables
+        WHERE table_schema = 'public'
+          AND table_name = 'academic_titles'
+        LIMIT 1
+        """
+    return (await conn.fetchrow(probe)) is None
+
+
+async def _needs_email_verification_migration(conn) -> bool:
+    """Return True when ``public.email_verification_tokens`` is missing.
+
+    The table is the sentinel for 013, which also adds ``users.email_verified``.
+    """
+    probe = """
+        SELECT 1
+        FROM information_schema.tables
+        WHERE table_schema = 'public'
+          AND table_name = 'email_verification_tokens'
+        LIMIT 1
+        """
+    return (await conn.fetchrow(probe)) is None
+
+
+async def _needs_registration_otp_migration(conn) -> bool:
+    """Return True when the ``public.registration_otp_codes`` table is missing (014 pending)."""
+    probe = """
+        SELECT 1
+        FROM information_schema.tables
+        WHERE table_schema = 'public'
+          AND table_name = 'registration_otp_codes'
+        LIMIT 1
+        """
+    return (await conn.fetchrow(probe)) is None
+
+
+async def _needs_document_templates_migration(conn) -> bool:
+    """Return True when the ``public.document_templates`` table is missing (015 pending)."""
+    probe = """
+        SELECT 1
+        FROM information_schema.tables
+        WHERE table_schema = 'public'
+          AND table_name = 'document_templates'
+        LIMIT 1
+        """
+    return (await conn.fetchrow(probe)) is None
+
+
+async def _needs_research_projects_migration(conn) -> bool:
+    """Return True when the ``public.research_projects`` table is missing (016 pending)."""
+    probe = """
+        SELECT 1
+        FROM information_schema.tables
+        WHERE table_schema = 'public'
+          AND table_name = 'research_projects'
+        LIMIT 1
+        """
+    return (await conn.fetchrow(probe)) is None
+
+
+async def _needs_imagehub_datasets_migration(conn) -> bool:
+    """Return True when the ``public.imagehub_datasets`` table is missing (017 pending)."""
+    probe = """
+        SELECT 1
+        FROM information_schema.tables
+        WHERE table_schema = 'public'
+          AND table_name = 'imagehub_datasets'
+        LIMIT 1
+        """
+    return (await conn.fetchrow(probe)) is None
+
+
+async def _needs_imagehub_segmentation_columns_migration(conn) -> bool:
+    """Return True when ``imagehub_dataset_files.file_kind`` is missing.
+
+    ``file_kind`` is the sentinel for the segmentation-link columns added by 018.
+    """
+    probe = """
+        SELECT 1
+        FROM information_schema.columns
+        WHERE table_schema = 'public'
+          AND table_name = 'imagehub_dataset_files'
+          AND column_name = 'file_kind'
+        LIMIT 1
+        """
+    return (await conn.fetchrow(probe)) is None
+
+
+async def _needs_cloud_import_migration(conn) -> bool:
+    """Return True when the ``public.imagehub_storage_methods`` table is missing (019 pending)."""
+    probe = """
+        SELECT 1
+        FROM information_schema.tables
+        WHERE table_schema = 'public'
+          AND table_name = 'imagehub_storage_methods'
+        LIMIT 1
+        """
+    return (await conn.fetchrow(probe)) is None
+
+
+async def _needs_imagehub_stages_migration(conn) -> bool:
+    """Return True when the ``public.imagehub_dataset_stages`` table is missing (020 pending)."""
+    probe = """
+        SELECT 1
+        FROM information_schema.tables
+        WHERE table_schema = 'public'
+          AND table_name = 'imagehub_dataset_stages'
+        LIMIT 1
+        """
+    return (await conn.fetchrow(probe)) is None
+
+
+async def _needs_imagehub_tasks_migration(conn) -> bool:
+    """Return True when the ``public.imagehub_tasks`` table is missing (021 pending)."""
+    probe = """
+        SELECT 1
+        FROM information_schema.tables
+        WHERE table_schema = 'public'
+          AND table_name = 'imagehub_tasks'
+        LIMIT 1
+        """
+    return (await conn.fetchrow(probe)) is None
+
+
+async def _needs_imagehub_task_annotations_migration(conn) -> bool:
+    """Return True when ``imagehub_tasks.annotations`` is missing (022 pending)."""
+    probe = """
+        SELECT 1
+        FROM information_schema.columns
+        WHERE table_schema = 'public'
+          AND table_name = 'imagehub_tasks'
+          AND column_name = 'annotations'
+        LIMIT 1
+        """
+    return (await conn.fetchrow(probe)) is None
+
+
+async def _needs_imagehub_members_migration(conn) -> bool:
+    """Return True when the ``public.imagehub_dataset_members`` table is missing (023 pending)."""
+    probe = """
+        SELECT 1
+        FROM information_schema.tables
+        WHERE table_schema = 'public'
+          AND table_name = 'imagehub_dataset_members'
+        LIMIT 1
+        """
+    return (await conn.fetchrow(probe)) is None
+
+
+async def _needs_imagehub_dataset_project_link_migration(conn) -> bool:
+    """Return True when ``imagehub_datasets.research_project_id`` is missing (024 pending)."""
+    probe = """
+        SELECT 1
+        FROM information_schema.columns
+        WHERE table_schema = 'public'
+          AND table_name = 'imagehub_datasets'
+          AND column_name = 'research_project_id'
+        LIMIT 1
+        """
+    return (await conn.fetchrow(probe)) is None
+
+
+async def _needs_imagehub_review_events_migration(conn) -> bool:
+    """Return True when the ``public.imagehub_task_review_events`` table is missing (025 pending)."""
+    probe = """
+        SELECT 1
+        FROM information_schema.tables
+        WHERE table_schema = 'public'
+          AND table_name = 'imagehub_task_review_events'
+        LIMIT 1
+        """
+    return (await conn.fetchrow(probe)) is None
+
+
+async def _needs_imagehub_folder_path_migration(conn) -> bool:
+    """Return True when ``imagehub_dataset_files.folder_path`` is missing (026 pending)."""
+    probe = """
+        SELECT 1
+        FROM information_schema.columns
+        WHERE table_schema = 'public'
+          AND table_name = 'imagehub_dataset_files'
+          AND column_name = 'folder_path'
+        LIMIT 1
+        """
+    return (await conn.fetchrow(probe)) is None
+
+
+async def _needs_imagehub_label_map_migration(conn) -> bool:
+    """Return True when ``imagehub_datasets.label_map`` is missing (027 pending)."""
+    probe = """
+        SELECT 1
+        FROM information_schema.columns
+        WHERE table_schema = 'public'
+          AND table_name = 'imagehub_datasets'
+          AND column_name = 'label_map'
+        LIMIT 1
+        """
+    return (await conn.fetchrow(probe)) is None
+
+
+async def _apply_sql_file(conn, path: Path, label: str) -> None:
+    """Run every statement of the SQL file at *path* as one atomic unit.
+
+    The file is read as UTF-8, whole-line comments are removed and the rest is
+    split into statements. All statements run inside a single transaction. If
+    any of them fails, nothing from the file is kept and the error propagates.
+    This matters because the callers decide whether to run a file by probing
+    for one table or column: a half-applied file that already created that
+    sentinel would never be retried.
+
+    Args:
+        conn: Open ``asyncpg`` connection.
+        path: Migration file to apply.
+        label: Short name used in the progress message.
+
+    NOTE(review): a migration containing a statement that cannot run inside a
+    transaction block (for example ``CREATE INDEX CONCURRENTLY``) would need to
+    bypass this helper. None of the files visible here contains one.
+    """
+    body = _strip_sql_comments(path.read_text(encoding="utf-8"))
+    statements = _split_sql_statements(body)
+    async with conn.transaction():
+        for stmt in statements:
+            await conn.execute(stmt)
+    print(f"apply_initiative_migrations: {label} applied.")
+
+
+async def main() -> int:
+    raw_url = (os.environ.get("INITIATIVE_DATABASE_URL") or "").strip()
+    if not raw_url.lower().startswith("postgresql"):
+        print("apply_initiative_migrations: no PostgreSQL URL; skipping.", file=sys.stderr)
+        return 0
+
+    root = Path(__file__).resolve().parent.parent
+    m008 = root / "migrations" / "008_audit_events.sql"
+    m009 = root / "migrations" / "009_backup_artifact_roles_storage_kind.sql"
+    m010 = root / "migrations" / "010_user_staff_profiles.sql"
+    m011 = root / "migrations" / "011_academic_titles_vn.sql"
+    for p in (m008, m009, m010, m011):
+        if not p.is_file():
+            print(f"apply_initiative_migrations: missing {p}", file=sys.stderr)
+            return 1
+
+    import asyncpg
+
+    dsn = _async_url_to_asyncpg_dsn(raw_url)
+    conn = await asyncpg.connect(dsn, timeout=60)
+    try:
+        if await _needs_audit_events_migration(conn):
+            print("apply_initiative_migrations: applying 008_audit_events …")
+            await _apply_sql_file(conn, m008, "008_audit_events")
+        else:
+            print("apply_initiative_migrations: audit_events present; OK.")
+
+        if await _needs_backup_migration(conn):
+            print("apply_initiative_migrations: applying 009_backup_artifact_roles_storage_kind …")
+            await _apply_sql_file(conn, m009, "009_backup_artifact_roles_storage_kind")
+        else:
+            print("apply_initiative_migrations: application_artifacts.storage_kind present; OK.")
+
+        if await _needs_staff_profiles_migration(conn):
+            print("apply_initiative_migrations: applying 010_user_staff_profiles …")
+            await _apply_sql_file(conn, m010, "010_user_staff_profiles")
+            print("apply_initiative_migrations: applying 011_academic_titles_vn …")
+            await _apply_sql_file(conn, m011, "011_academic_titles_vn")
+        else:
+            print("apply_initiative_migrations: academic_titles present; OK.")
+
+        m013 = root / "migrations" / "013_email_verification.sql"
+        if not m013.is_file():
+            print(f"apply_initiative_migrations: missing {m013}", file=sys.stderr)
+            return 1
+        if await _needs_email_verification_migration(conn):
+            print("apply_initiative_migrations: applying 013_email_verification …")
+            await _apply_sql_file(conn, m013, "013_email_verification")
+        else:
+            print("apply_initiative_migrations: email_verification_tokens present; OK.")
+
+        m014 = root / "migrations" / "014_registration_otp.sql"
+        if not m014.is_file():
+            print(f"apply_initiative_migrations: missing {m014}", file=sys.stderr)
+            return 1
+        if await _needs_registration_otp_migration(conn):
+            print("apply_initiative_migrations: applying 014_registration_otp …")
+            await _apply_sql_file(conn, m014, "014_registration_otp")
+        else:
+            print("apply_initiative_migrations: registration_otp_codes present; OK.")
+
+        m015 = root / "migrations" / "015_document_templates.sql"
+        if not m015.is_file():
+            print(f"apply_initiative_migrations: missing {m015}", file=sys.stderr)
+            return 1
+        if await _needs_document_templates_migration(conn):
+            print("apply_initiative_migrations: applying 015_document_templates …")
+            await _apply_sql_file(conn, m015, "015_document_templates")
+        else:
+            print("apply_initiative_migrations: document_templates present; OK.")
+
+        m016 = root / "migrations" / "016_research_projects.sql"
+        if not m016.is_file():
+            print(f"apply_initiative_migrations: missing {m016}", file=sys.stderr)
+            return 1
+        if await _needs_research_projects_migration(conn):
+            print("apply_initiative_migrations: applying 016_research_projects …")
+            await _apply_sql_file(conn, m016, "016_research_projects")
+        else:
+            print("apply_initiative_migrations: research_projects present; OK.")
+
+        m017 = root / "migrations" / "017_imagehub_datasets.sql"
+        if not m017.is_file():
+            print(f"apply_initiative_migrations: missing {m017}", file=sys.stderr)
+            return 1
+        if await _needs_imagehub_datasets_migration(conn):
+            print("apply_initiative_migrations: applying 017_imagehub_datasets …")
+            await _apply_sql_file(conn, m017, "017_imagehub_datasets")
+        else:
+            print("apply_initiative_migrations: imagehub_datasets present; OK.")
+
+        m018 = root / "migrations" / "018_imagehub_segmentation_links.sql"
+        if not m018.is_file():
+            print(f"apply_initiative_migrations: missing {m018}", file=sys.stderr)
+            return 1
+        if await _needs_imagehub_segmentation_columns_migration(conn):
+            print("apply_initiative_migrations: applying 018_imagehub_segmentation_links …")
+            await _apply_sql_file(conn, m018, "018_imagehub_segmentation_links")
+        else:
+            print("apply_initiative_migrations: imagehub_dataset_files.file_kind present; OK.")
+
+        m019 = root / "migrations" / "019_imagehub_cloud_import.sql"
+        if not m019.is_file():
+            print(f"apply_initiative_migrations: missing {m019}", file=sys.stderr)
+            return 1
+        if await _needs_cloud_import_migration(conn):
+            print("apply_initiative_migrations: applying 019_imagehub_cloud_import …")
+            await _apply_sql_file(conn, m019, "019_imagehub_cloud_import")
+        else:
+            print("apply_initiative_migrations: imagehub_storage_methods present; OK.")
+
+        m020 = root / "migrations" / "020_imagehub_dataset_stages.sql"
+        if not m020.is_file():
+            print(f"apply_initiative_migrations: missing {m020}", file=sys.stderr)
+            return 1
+        if await _needs_imagehub_stages_migration(conn):
+            print("apply_initiative_migrations: applying 020_imagehub_dataset_stages …")
+            await _apply_sql_file(conn, m020, "020_imagehub_dataset_stages")
+        else:
+            print("apply_initiative_migrations: imagehub_dataset_stages present; OK.")
+
+        m021 = root / "migrations" / "021_imagehub_task_pipeline.sql"
+        if not m021.is_file():
+            print(f"apply_initiative_migrations: missing {m021}", file=sys.stderr)
+            return 1
+        if await _needs_imagehub_tasks_migration(conn):
+            print("apply_initiative_migrations: applying 021_imagehub_task_pipeline …")
+            await _apply_sql_file(conn, m021, "021_imagehub_task_pipeline")
+        else:
+            print("apply_initiative_migrations: imagehub_tasks present; OK.")
+
+        m022 = root / "migrations" / "022_imagehub_task_annotations.sql"
+        if not m022.is_file():
+            print(f"apply_initiative_migrations: missing {m022}", file=sys.stderr)
+            return 1
+        if await _needs_imagehub_task_annotations_migration(conn):
+            print("apply_initiative_migrations: applying 022_imagehub_task_annotations …")
+            await _apply_sql_file(conn, m022, "022_imagehub_task_annotations")
+        else:
+            print("apply_initiative_migrations: imagehub_tasks.annotations present; OK.")
+
+        m023 = root / "migrations" / "023_imagehub_dataset_members.sql"
+        if not m023.is_file():
+            print(f"apply_initiative_migrations: missing {m023}", file=sys.stderr)
+            return 1
+        if await _needs_imagehub_members_migration(conn):
+            print("apply_initiative_migrations: applying 023_imagehub_dataset_members …")
+            await _apply_sql_file(conn, m023, "023_imagehub_dataset_members")
+        else:
+            print("apply_initiative_migrations: imagehub_dataset_members present; OK.")
+
+        m024 = root / "migrations" / "024_imagehub_dataset_project_link.sql"
+        if not m024.is_file():
+            print(f"apply_initiative_migrations: missing {m024}", file=sys.stderr)
+            return 1
+        if await _needs_imagehub_dataset_project_link_migration(conn):
+            print("apply_initiative_migrations: applying 024_imagehub_dataset_project_link …")
+            await _apply_sql_file(conn, m024, "024_imagehub_dataset_project_link")
+        else:
+            print("apply_initiative_migrations: imagehub_datasets.research_project_id present; OK.")
+
+        m025 = root / "migrations" / "025_imagehub_task_review_events.sql"
+        if not m025.is_file():
+            print(f"apply_initiative_migrations: missing {m025}", file=sys.stderr)
+            return 1
+        if await _needs_imagehub_review_events_migration(conn):
+            print("apply_initiative_migrations: applying 025_imagehub_task_review_events …")
+            await _apply_sql_file(conn, m025, "025_imagehub_task_review_events")
+        else:
+            print("apply_initiative_migrations: imagehub_task_review_events present; OK.")
+
+        m026 = root / "migrations" / "026_imagehub_file_folder_path.sql"
+        if not m026.is_file():
+            print(f"apply_initiative_migrations: missing {m026}", file=sys.stderr)
+            return 1
+        if await _needs_imagehub_folder_path_migration(conn):
+            print("apply_initiative_migrations: applying 026_imagehub_file_folder_path …")
+            await _apply_sql_file(conn, m026, "026_imagehub_file_folder_path")
+        else:
+            print("apply_initiative_migrations: imagehub_dataset_files.folder_path present; OK.")
+
+        m027 = root / "migrations" / "027_imagehub_dataset_label_map.sql"
+        if not m027.is_file():
+            print(f"apply_initiative_migrations: missing {m027}", file=sys.stderr)
+            return 1
+        if await _needs_imagehub_label_map_migration(conn):
+            print("apply_initiative_migrations: applying 027_imagehub_dataset_label_map …")
+            await _apply_sql_file(conn, m027, "027_imagehub_dataset_label_map")
+        else:
+            print("apply_initiative_migrations: imagehub_datasets.label_map present; OK.")
+
+        return 0
+    except Exception as exc:
+        print(f"apply_initiative_migrations: FAILED: {exc}", file=sys.stderr)
+        if os.environ.get("INITIATIVE_DB_STRICT_MIGRATE", "").strip().lower() in ("1", "true", "yes"):
+            return 1
+        return 0
+    finally:
+        await conn.close()
+
+
+if __name__ == "__main__":
+    raise SystemExit(asyncio.run(main()))
@@ -0,0 +1,90 @@
+#!/usr/bin/env python3
+"""
+CLI: merge a mis-linked submission onto the real CASE-* initiative row and delete the orphan initiative.
+
+Usage (dry-run — default, no writes):
+
+  cd be0
+  export INITIATIVE_DATABASE_URL="postgresql+asyncpg://user:pass@host:5432/initiatives"
+  python scripts/repair_split_submission.py --submission-id sub-d560fbb6f2944ec6
+
+Apply (commits one transaction):
+
+  python scripts/repair_split_submission.py --submission-id sub-... --good-case CASE-YOURCODE --execute
+
+Requires the same Postgres URL as the API (`INITIATIVE_DATABASE_URL` / `DATABASE_URL`).
+"""
+from __future__ import annotations
+
+import argparse
+import asyncio
+import os
+import sys
+
+SCRIPT_DIR = os.path.dirname(os.path.abspath(__file__))
+ROOT = os.path.abspath(os.path.join(SCRIPT_DIR, ".."))
+if ROOT not in sys.path:
+    sys.path.insert(0, ROOT)
+
+
+async def _main_async() -> int:
+    p = argparse.ArgumentParser(description="Repair split submission / wrong initiative linkage.")
+    p.add_argument(
+        "--submission-id",
+        required=True,
+        help="submissionRecord.id (e.g. sub-d560fbb6f2944ec6)",
+    )
+    p.add_argument(
+        "--good-case",
+        dest="good_case",
+        default=None,
+        help="Explicit CASE-* code for the autosave row (recommended if owner has multiple drafts)",
+    )
+    p.add_argument(
+        "--execute",
+        action="store_true",
+        help="Apply changes (otherwise dry-run only)",
+    )
+    args = p.parse_args()
+
+    os.environ.setdefault("INITIATIVE_DATABASE_URL", os.getenv("DATABASE_URL") or "")
+    from src.initiative_db.engine import get_session, init_engine, is_postgres_enabled
+    from src.initiative_db.repair_split_submission import repair_submission_cross_initiative_merge
+
+    if not is_postgres_enabled():
+        print("Error: set INITIATIVE_DATABASE_URL=postgresql+asyncpg://.../initiatives", file=sys.stderr)
+        return 2
+
+    await init_engine()
+
+    async with get_session() as session:
+        report = await repair_submission_cross_initiative_merge(
+            session,
+            submission_record_id=args.submission_id.strip(),
+            good_case_code_explicit=(args.good_case or "").strip() or None,
+            dry_run=not args.execute,
+        )
+
+    lines = [
+        f"dry_run={report.dry_run}",
+        f"submission_record_id={report.submission_record_id}",
+        f"owner_id={report.owner_id or '(n/a)'}",
+        f"bad_case={report.bad_case_code or '(n/a)'}",
+        f"good_case={report.good_case_code or '(n/a)'}",
+    ]
+    if report.skipped:
+        lines.append(f"SKIPPED: {report.skipped}")
+    lines.extend(report.actions)
+    print("\n".join(lines))
+
+    if args.execute and report.skipped:
+        return 3
+    return 0
+
+
+def main() -> None:
+    raise SystemExit(asyncio.run(_main_async()))
+
+
+if __name__ == "__main__":
+    # Script entry point; main() finishes by raising SystemExit with the exit code.
+    main()
--- a/Show More
+++ b/Show More