AdaptiveMotorControlLab · xiu-cs · Feb 10, 2026 · Feb 9, 2026 · Feb 9, 2026 · Feb 9, 2026
diff --git a/demo/vis_in_the_wild.py b/demo/vis_in_the_wild.py
@@ -25,17 +25,10 @@
 
 args = parse_args().parse()
 os.environ["CUDA_VISIBLE_DEVICES"] = args.gpu
-if getattr(args, 'model_path', ''):
-    import importlib.util
-    import pathlib
-    model_abspath = os.path.abspath(args.model_path)
-    module_name = pathlib.Path(model_abspath).stem
-    spec = importlib.util.spec_from_file_location(module_name, model_abspath)
-    module = importlib.util.module_from_spec(spec)
-    assert spec.loader is not None
-    spec.loader.exec_module(module)
-    CFM = getattr(module, 'Model')
-
+
+from fmpose3d.models import get_model
+CFM = get_model(args.model_type)
+
 from fmpose3d.common.camera import *
 
 import matplotlib

diff --git a/demo/vis_in_the_wild.sh b/demo/vis_in_the_wild.sh
@@ -5,7 +5,7 @@ sample_steps=3
 batch_size=1
 sh_file='vis_in_the_wild.sh'
 
-model_path='../pre_trained_models/fmpose3d_h36m/model_GAMLP.py'
+model_type='fmpose3d'
 model_weights_path='../pre_trained_models/fmpose3d_h36m/FMpose3D_pretrained_weights.pth'
 
 target_path='./images/'  # folder containing multiple images
@@ -16,7 +16,7 @@ python3 vis_in_the_wild.py \
  --type 'image' \
  --path ${target_path} \
  --model_weights_path "${model_weights_path}" \
- --model_path "${model_path}" \
+ --model_type "${model_type}" \
  --sample_steps ${sample_steps} \
  --batch_size ${batch_size} \
  --layers ${layers} \

diff --git a/fmpose3d/common/__init__.py b/fmpose3d/common/__init__.py
@@ -12,6 +12,19 @@
 """
 
 from .arguments import opts
+from .config import (
+    FMPoseConfig,
+    ModelConfig,
+    DatasetConfig,
+    TrainingConfig,
+    InferenceConfig,
+    AggregationConfig,
+    CheckpointConfig,
+    RefinementConfig,
+    OutputConfig,
+    DemoConfig,
+    RuntimeConfig,
+)
 from .h36m_dataset import Human36mDataset
 from .load_data_hm36 import Fusion
 from .utils import (
@@ -27,6 +40,17 @@
 
 __all__ = [
     "opts",
+    "FMPoseConfig",
+    "ModelConfig",
+    "DatasetConfig",
+    "TrainingConfig",
+    "InferenceConfig",
+    "AggregationConfig",
+    "CheckpointConfig",
+    "RefinementConfig",
+    "OutputConfig",
+    "DemoConfig",
+    "RuntimeConfig",
     "Human36mDataset",
     "Fusion",
     "mpjpe_cal",

diff --git a/fmpose3d/common/arguments.py b/fmpose3d/common/arguments.py
@@ -74,6 +74,8 @@ def init(self):
         self.parser.add_argument("--model_dir", type=str, default="")
         # Optional: load model class from a specific file path
         self.parser.add_argument("--model_path", type=str, default="")
+        # Model registry name (e.g. "fmpose3d"); used instead of --model_path
+        self.parser.add_argument("--model_type", type=str, default="fmpose3d")
         self.parser.add_argument("--model_weights_path", type=str, default="")
 
         self.parser.add_argument("--post_refine_reload", action="store_true")

diff --git a/fmpose3d/common/config.py b/fmpose3d/common/config.py
@@ -0,0 +1,233 @@
+"""
+FMPose3D: monocular 3D Pose Estimation via Flow Matching
+
+Official implementation of the paper:
+"FMPose3D: monocular 3D Pose Estimation via Flow Matching"
+by Ti Wang, Xiaohang Yu, and Mackenzie Weygandt Mathis
+Licensed under Apache 2.0
+"""
+
+import math
+from dataclasses import dataclass, field, fields, asdict
+from typing import List
+
+
+# ---------------------------------------------------------------------------
+# Dataclass configuration groups
+# ---------------------------------------------------------------------------
+
+
+@dataclass
+class ModelConfig:
+    """Model architecture configuration."""
+
+    model: str = ""
+    model_type: str = "fmpose3d"
+    layers: int = 3
+    channel: int = 512
+    d_hid: int = 1024
+    token_dim: int = 256
+    n_joints: int = 17
+    out_joints: int = 17
+    in_channels: int = 2
+    out_channels: int = 3
+    frames: int = 1
+    # NOTE: ``--model_path`` has no field here; the model class is chosen by ``model_type``.
+
+
+@dataclass
+class DatasetConfig:
+    """Dataset and data loading configuration."""
+
+    dataset: str = "h36m"
+    keypoints: str = "cpn_ft_h36m_dbb"
+    root_path: str = "dataset/"
+    actions: str = "*"
+    downsample: int = 1
+    subset: float = 1.0
+    stride: int = 1
+    crop_uv: int = 0
+    out_all: int = 1
+    train_views: List[int] = field(default_factory=lambda: [0, 1, 2, 3])
+    test_views: List[int] = field(default_factory=lambda: [0, 1, 2, 3])
+
+    # Derived / set during parse based on dataset choice
+    subjects_train: str = "S1,S5,S6,S7,S8"
+    subjects_test: str = "S9,S11"
+    root_joint: int = 0
+    joints_left: List[int] = field(default_factory=list)
+    joints_right: List[int] = field(default_factory=list)
+
+
+@dataclass
+class TrainingConfig:
+    """Training hyperparameters and settings."""
+
+    train: bool = False
+    nepoch: int = 41
+    batch_size: int = 128
+    lr: float = 1e-3
+    lr_decay: float = 0.95
+    lr_decay_large: float = 0.5
+    large_decay_epoch: int = 5
+    workers: int = 8
+    data_augmentation: bool = True
+    reverse_augmentation: bool = False
+    norm: float = 0.01
+
+
+@dataclass
+class InferenceConfig:
+    """Evaluation and testing configuration."""
+
+    test: int = 1
+    test_augmentation: bool = True
+    test_augmentation_flip_hypothesis: bool = False
+    test_augmentation_FlowAug: bool = False
+    sample_steps: int = 3
+    eval_multi_steps: bool = False
+    eval_sample_steps: str = "1,3,5,7,9"
+    num_hypothesis_list: str = "1"
+    hypothesis_num: int = 1
+    guidance_scale: float = 1.0
+
+
+@dataclass
+class AggregationConfig:
+    """Hypothesis aggregation configuration."""
+
+    topk: int = 3
+    exp_temp: float = 0.002
+    mode: str = "exp"
+    opt_steps: int = 2
+
+
+@dataclass
+class CheckpointConfig:
+    """Checkpoint loading and saving configuration."""
+
+    reload: bool = False
+    model_dir: str = ""
+    model_weights_path: str = ""
+    checkpoint: str = ""
+    previous_dir: str = "./pre_trained_model/pretrained"
+    num_saved_models: int = 3
+    previous_best_threshold: float = math.inf
+    previous_name: str = ""
+
+
+@dataclass
+class RefinementConfig:
+    """Post-refinement model configuration."""
+
+    post_refine: bool = False
+    post_refine_reload: bool = False
+    previous_post_refine_name: str = ""
+    lr_refine: float = 1e-5
+    refine: bool = False
+    reload_refine: bool = False
+    previous_refine_name: str = ""
+
+
+@dataclass
+class OutputConfig:
+    """Output, logging, and file management configuration."""
+
+    create_time: str = ""
+    filename: str = ""
+    create_file: int = 1
+    debug: bool = False
+    folder_name: str = ""
+    sh_file: str = ""
+
+
+@dataclass
+class DemoConfig:
+    """Demo input configuration (what the demo scripts run on)."""
+
+    type: str = "image"
+    """Input type: ``'image'`` or ``'video'``."""
+    path: str = "demo/images/running.png"
+    """Path to input file or directory."""
+
+
+@dataclass
+class RuntimeConfig:
+    """Runtime environment configuration."""
+
+    gpu: str = "0"
+    pad: int = 0  # derived: (frames - 1) // 2
+    single: bool = False
+    reload_3d: bool = False
+
+
+# ---------------------------------------------------------------------------
+# Composite configuration
+# ---------------------------------------------------------------------------
+
+_SUB_CONFIG_CLASSES = {
+    "model_cfg": ModelConfig,
+    "dataset_cfg": DatasetConfig,
+    "training_cfg": TrainingConfig,
+    "inference_cfg": InferenceConfig,
+    "aggregation_cfg": AggregationConfig,
+    "checkpoint_cfg": CheckpointConfig,
+    "refinement_cfg": RefinementConfig,
+    "output_cfg": OutputConfig,
+    "demo_cfg": DemoConfig,
+    "runtime_cfg": RuntimeConfig,
+}
+
+
+@dataclass
+class FMPoseConfig:
+    """Top-level configuration for FMPose3D.
+
+    Groups related settings into sub-configs::
+
+        config.model_cfg.layers
+        config.training_cfg.lr
+    """
+
+    model_cfg: ModelConfig = field(default_factory=ModelConfig)
+    dataset_cfg: DatasetConfig = field(default_factory=DatasetConfig)
+    training_cfg: TrainingConfig = field(default_factory=TrainingConfig)
+    inference_cfg: InferenceConfig = field(default_factory=InferenceConfig)
+    aggregation_cfg: AggregationConfig = field(default_factory=AggregationConfig)
+    checkpoint_cfg: CheckpointConfig = field(default_factory=CheckpointConfig)
+    refinement_cfg: RefinementConfig = field(default_factory=RefinementConfig)
+    output_cfg: OutputConfig = field(default_factory=OutputConfig)
+    demo_cfg: DemoConfig = field(default_factory=DemoConfig)
+    runtime_cfg: RuntimeConfig = field(default_factory=RuntimeConfig)
+
+    # -- construction from argparse namespace ---------------------------------
+
+    @classmethod
+    def from_namespace(cls, ns) -> "FMPoseConfig":
+        """Build from an ``argparse.Namespace`` or ``dict``; unknown keys are ignored.
+
+        Example::
+
+            args = opts().parse()
+            cfg = FMPoseConfig.from_namespace(args)
+        """
+        raw = vars(ns) if hasattr(ns, "__dict__") else dict(ns)
+
+        def _pick(dc_class, src: dict):
+            names = {f.name for f in fields(dc_class)}
+            return dc_class(**{k: v for k, v in src.items() if k in names})
+
+        return cls(**{
+            group_name: _pick(dc_class, raw)
+            for group_name, dc_class in _SUB_CONFIG_CLASSES.items()
+        })
+
+    # -- utilities ------------------------------------------------------------
+
+    def to_dict(self) -> dict:
+        """Return all sub-config fields merged into one flat dict (later groups win)."""
+        result = {}
+        for group_name in _SUB_CONFIG_CLASSES:
+            result.update(asdict(getattr(self, group_name)))
+        return result
+
diff --git a/fmpose3d/models/__init__.py b/fmpose3d/models/__init__.py
@@ -11,10 +11,16 @@
 FMPose3D models.
 """
 
-from .graph_frames import Graph
-from .model_GAMLP import Model
+from .base_model import BaseModel, register_model, get_model, list_models
+
+# Import model subpackages so their @register_model decorators execute.
+from .fmpose3d import Graph, Model
 
 __all__ = [
+    "BaseModel",
+    "register_model",
+    "get_model",
+    "list_models",
     "Graph",
     "Model",
 ]