Move metadata xlsx/TSV to /mnt/data/projects/cupido/
Consolidates everything bulky (tracking DBs, target-point JSONs, and the metadata spreadsheet) under a single DATA_VOLUME root outside the ownCloud-synced repo.

Notebooks now use a visible DATA_DIR = Path(...) idiom rather than walking up the filesystem with PROJECT_ROOT.parent, which is easier for students with no Python background to follow.

Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>
This commit is contained in:
parent
ec56e51bf9
commit
f176224150
8 changed files with 102 additions and 160 deletions
|
|
@@ -2,21 +2,26 @@
|
|||
|
||||
from pathlib import Path
|
||||
|
||||
# Where this code repository lives (the directory containing scripts/, notebooks/, ...).
|
||||
PROJECT_ROOT = Path(__file__).resolve().parent.parent
|
||||
DATA_RAW = PROJECT_ROOT / "data" / "raw"
|
||||
DATA_METADATA = PROJECT_ROOT / "data" / "metadata"
|
||||
DATA_PROCESSED = PROJECT_ROOT / "data" / "processed"
|
||||
FIGURES = PROJECT_ROOT / "figures"
|
||||
|
||||
# Offline-tracking pipeline paths
|
||||
VIDEOS_ROOT = Path("/mnt/ethoscope_data/videos")
|
||||
VIDEO_INFO_XLSX = PROJECT_ROOT.parent / "all_video_info_merged.xlsx"
|
||||
INVENTORY_CSV = DATA_METADATA / "video_inventory.csv"
|
||||
# Reason: kept on the local data volume alongside the tracking DBs (out of
|
||||
# ownCloud sync). See TRACKING_OUTPUT_DIR comment below.
|
||||
TARGETS_DIR = Path("/mnt/data/projects/cupido/targets")
|
||||
# Reason: tracking DBs are large binary files that don't belong in
|
||||
# ownCloud-synced storage (sync conflicts + bandwidth). They live on the
|
||||
# local data volume instead. Regenerable from videos + target JSONs.
|
||||
TRACKING_OUTPUT_DIR = Path("/mnt/data/projects/cupido/tracked")
|
||||
LOGS_DIR = PROJECT_ROOT / "data" / "logs"
|
||||
|
||||
# Where the source videos live (read-only NFS mount).
|
||||
VIDEOS_ROOT = Path("/mnt/ethoscope_data/videos")
|
||||
|
||||
# Where the project's bulky data lives — outside the ownCloud-synced repo so
|
||||
# it doesn't churn the cloud sync. This single root holds everything that's
|
||||
# big or regenerable: tracking DBs, target-point JSONs, and the metadata
|
||||
# spreadsheet (xlsx + TSV).
|
||||
DATA_VOLUME = Path("/mnt/data/projects/cupido")
|
||||
TARGETS_DIR = DATA_VOLUME / "targets"
|
||||
TRACKING_OUTPUT_DIR = DATA_VOLUME / "tracked"
|
||||
VIDEO_INFO_XLSX = DATA_VOLUME / "all_video_info_merged.xlsx"
|
||||
VIDEO_INFO_TSV = DATA_VOLUME / "all_video_info_merged.tsv"
|
||||
|
||||
# A small CSV listing every video file we know about (built locally).
|
||||
INVENTORY_CSV = DATA_METADATA / "video_inventory.csv"
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue