Files
HSAP/platform/as_platform/data/ingest/registry.py
Chengfang Lu e72bc061c5 feat: HSAP platform v2 — modular navigation, quality review, audit log, world model simulation
Major changes:
- New frontend (platform/web/): Vite + React 18 + TypeScript + Tailwind
- 4-module navigation: 数据送标 / 模型管理 / 车队管理 / 系统管理
- Data catalog with charts (DMS/ADAS/Lane 3-tab view)
- Quality review workflow (标注质检): Good/Fine/Bad scoring with auto-advance
- Audit enhancements: batch operations, rejection categories, Feishu notifications
- Operation audit log (操作日志)
- World model simulation studio (仿真工坊)
- Dataset version management with snapshots and diff
- ADAS 7-class dataset integration (138K images organized + compressed)
- User management with Feishu integration and pagination
- CRUD/search/filter on all pages, card layout redesign
- PIL-optimized image overlay rendering
- Auto-snapshot on build, in_review workflow stage
- Removed embedded algorithm code (now in workspace)
2026-06-03 11:40:21 +08:00

58 lines
2.0 KiB
Python
Raw Blame History

This file contains ambiguous Unicode characters
This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.
"""Adapter registry and auto detection for uploaded datasets."""
from __future__ import annotations
from pathlib import Path
from as_platform.data.ingest.base import IngestAdapter, IngestContext, NormalizedDataset
from as_platform.data.ingest.dms_coco import DmsCocoAdapter
from as_platform.data.ingest.dms_inbox_raw import DmsInboxRawAdapter
from as_platform.data.ingest.dms_yolo import DmsYoloAdapter
from as_platform.data.ingest.lane_lines import LaneLinesAdapter
from as_platform.data.ingest.lane_mask import LaneMaskAdapter
class UnknownFormatError(ValueError):
    """Raised when no registered adapter recognizes an uploaded dataset.

    Subclasses ``ValueError`` so callers that already catch ``ValueError``
    keep working.
    """
# Registration order doubles as detection priority: detect_adapter() returns
# the first adapter in this tuple that accepts the ingest context.
ADAPTERS: tuple[IngestAdapter, ...] = tuple(
    adapter_cls()
    for adapter_cls in (
        DmsYoloAdapter,
        DmsCocoAdapter,
        DmsInboxRawAdapter,
        LaneMaskAdapter,
        LaneLinesAdapter,
    )
)
def available_formats(project: str) -> list[str]:
    """List the ``format_id`` of every registered adapter serving ``project``.

    Args:
        project: Project key matched against each adapter's ``projects``.

    Returns:
        Format ids in ``ADAPTERS`` registration order; empty when no adapter
        lists the project.
    """
    format_ids: list[str] = []
    for candidate in ADAPTERS:
        if project in candidate.projects:
            format_ids.append(candidate.format_id)
    return format_ids
def detect_adapter(ctx: IngestContext) -> IngestAdapter:
    """Return the first registered adapter that can ingest ``ctx``.

    Adapters in ``ADAPTERS`` are tried in registration order. An adapter is
    skipped when ``ctx.project`` is not in its ``projects``; otherwise the
    first one whose ``can_handle(ctx)`` is truthy is returned.

    Args:
        ctx: Ingest context; ``project``, ``task`` and ``source_path`` are
            read here and the whole context is passed to ``can_handle``.

    Returns:
        The matching adapter instance from ``ADAPTERS``.

    Raises:
        UnknownFormatError: If no adapter registered for the project accepts
            the context. The message lists the supported formats and, for
            the ``dms`` project, a layout hint.
    """
    for adapter in ADAPTERS:
        # Short-circuit keeps can_handle() from running for other projects.
        if ctx.project in adapter.projects and adapter.can_handle(ctx):
            return adapter

    hint = ""
    if ctx.project == "dms":
        # The leading ". " separates the hint from the supported-format list
        # (previously they were fused together), and the fullwidth
        # parenthesis opened in the hint is now closed.
        hint = (
            ". DMS 送标/inbox 请使用批次根目录,且至少包含 images/train/*.jpg"
            "(或已标注的 images/+labels/、COCO annotations/)"
        )
    raise UnknownFormatError(
        f"unable to detect format for project={ctx.project}, task={ctx.task}, "
        f"source={ctx.source_path}. supported={available_formats(ctx.project)}{hint}"
    )
def inspect_uploaded_dataset(project: str, task: str | None, source_path: str | Path) -> NormalizedDataset:
    """Detect the format of an uploaded dataset and return its inspection result.

    Args:
        project: Project key used to select candidate adapters.
        task: Optional task name, forwarded unchanged in the ingest context.
        source_path: Dataset location; resolved to an absolute path before use.

    Returns:
        The dataset produced by the detected adapter's ``inspect``, with its
        ``format_id`` overwritten by the adapter's own ``format_id``.

    Raises:
        FileNotFoundError: If the resolved source path does not exist.
        UnknownFormatError: Propagated from ``detect_adapter`` when no adapter
            accepts the upload.
    """
    resolved_source = Path(source_path).resolve()
    ctx = IngestContext(project=project, task=task, source_path=resolved_source)
    if not ctx.source_path.exists():
        raise FileNotFoundError(f"source path not found: {ctx.source_path}")

    matched = detect_adapter(ctx)
    dataset = matched.inspect(ctx)
    # Stamp the adapter's id on the result regardless of what inspect() set.
    dataset.format_id = matched.format_id
    return dataset