first commit

2026-01-12 18:25:04 +09:00
commit cb03f4a6e1
7 changed files with 1124 additions and 0 deletions
--- a/.gitignore
+++ b/.gitignore
@ -0,0 +1,2 @@
 .env
 *.pyc
--- a/dotenv_loader.py
+++ b/dotenv_loader.py
@ -0,0 +1,62 @@
 from __future__ import annotations
 import os
 from pathlib import Path
 from typing import Optional
 def load_dotenv_into_environ(dotenv_path: os.PathLike[str] | str, *, override: bool = False) -> bool:
    """
    Load KEY=VALUE lines from a .env file into os.environ.
    - Supports lines like: KEY=VALUE, export KEY=VALUE
    - Ignores blank lines and # comments
    - Handles single/double-quoted values
    - Does not expand ${VARS} or handle multiline values
    Returns True if the file existed and was read.
    """
    path = Path(dotenv_path)
    if not path.is_file():
        return False
    content = path.read_text(encoding="utf-8")
    # Remove UTF-8 BOM if present
    if content.startswith("\ufeff"):
        content = content.lstrip("\ufeff")
    for raw_line in content.splitlines():
        line = raw_line.strip()
        if not line or line.startswith("#"):
            continue
        if line.startswith("export "):
            line = line[len("export ") :].lstrip()
        if "=" not in line:
            continue
        key, value = line.split("=", 1)
        key = key.strip()
        value = value.strip()
        if not key:
            continue
        if len(value) >= 2 and value[0] == value[-1] and value[0] in ("'", '"'):
            value = value[1:-1]
        if not override and key in os.environ:
            continue
        os.environ[key] = value
    return True
 def load_llm_fsm_dotenv(*, override: bool = False, filename: str = ".env") -> bool:
    """
    Convenience loader for `.env` next to `scripts/llm_fsm` runner scripts.
    """
    dotenv_path = Path(__file__).resolve().parent / filename
    return load_dotenv_into_environ(dotenv_path, override=override)
--- a/llm_fsm_multi_env.py
+++ b/llm_fsm_multi_env.py
@ -0,0 +1,677 @@
 # llm_fsm_multi_env.py
 from __future__ import annotations
 from dataclasses import dataclass
 from typing import Any, Dict, List, Literal, Optional, Tuple
 import torch
 # --------------------------
 # Types
 # --------------------------
 Vec3T = torch.Tensor       # (N,3)
 QuatT = torch.Tensor       # (N,4) wxyz
 MaskT = torch.Tensor       # (N,) bool
 SkillName = Literal[
    "pick", "release", "place", "drop",
    "align", "insert", "remove",
    "rotate", "rotate_until_limit",
    "fasten", "loosen",
    "open", "close",
    "clamp", "unclamp",
    "press", "toggle",
    "insert_into", "remove_from",
    "regrasp", "adjust_pose",
 ]
 PredicateType = Literal[
    "is_grasped",
    "object_on_surface",
    "object_in_container",
    "object_in_fixture",
    "pose_in_tolerance",
    "depth_in_range",
    "fixture_state",
    "button_pressed",
    "switch_state",
    "thread_engaged",
 ]
 # --------------------------
 # Spec dataclasses
 # --------------------------
@dataclass
 class SkillSpec:
    name: SkillName
    args: Dict[str, Any]
@dataclass
 class PredicateSpec:
    type: PredicateType
    args: Dict[str, Any]  # free-form params
@dataclass
 class GoalSpec:
    summary: str
    success_conditions: List[PredicateSpec]
@dataclass
 class TaskSpec:
    task_id: str
    activity: str
    task_name: str
    skills: List[SkillSpec]
    goal: GoalSpec
    @staticmethod
    def from_dict(task: Dict[str, Any]) -> "TaskSpec":
        skills_in = task.get("skills", [])
        skills: List[SkillSpec] = []
        for s in skills_in:
            if not isinstance(s, dict):
                raise TypeError(f"Skill entry must be a dict, got: {type(s)}")
            skills.append(SkillSpec(name=s["name"], args=dict(s.get("args", {}))))
        goal_in = task.get("goal", {})
        preds_in = goal_in.get("success_conditions", [])
        preds: List[PredicateSpec] = []
        for p in preds_in:
            if not isinstance(p, dict):
                raise TypeError(f"Predicate entry must be a dict, got: {type(p)}")
            p_type = p["type"]
            p_args = dict(p)
            p_args.pop("type", None)
            preds.append(PredicateSpec(type=p_type, args=p_args))
        goal = GoalSpec(summary=goal_in.get("summary", ""), success_conditions=preds)
        return TaskSpec(
            task_id=task.get("task_id", ""),
            activity=task.get("activity", ""),
            task_name=task.get("task_name", ""),
            skills=skills,
            goal=goal,
        )
 # --------------------------
 # Minimal Batched Env API (YOU implement these)
 # --------------------------
 class BatchedEnvAPI:
    """
    You adapt this to your IsaacLab env.
    Required to be batched over num_envs (N).
    All returned tensors are on the same device as env (typically CUDA).
    """
    device: torch.device
    num_envs: int
    # --- asset queries ---
    def get_pose_w(self, name: str) -> tuple[Vec3T, QuatT]:
        """Return pose of an entity by name: pos (N,3), quat (N,4) wxyz."""
        raise NotImplementedError
    def contains(self, fixture_or_container: str, obj: str) -> MaskT:
        """Return (N,) bool if obj is in fixture/container region."""
        raise NotImplementedError
    def fixture_state(self, fixture: str, state_name: str) -> Any:
        """
        Return a batched state. Common choices:
          - bool tensor (N,) for open/closed
          - float tensor (N,) for joint position / open ratio
          - int tensor (N,) for discrete states
        """
        raise NotImplementedError
    def button_pressed(self, fixture: str, button: str) -> MaskT:
        raise NotImplementedError
    def switch_state(self, fixture: str, switch: str) -> Any:
        raise NotImplementedError
    # --- stepping / resets ---
    def step_physics(self, action: Optional[torch.Tensor] = None) -> None:
        """Advance sim one step. action can be dummy if you drive controllers elsewhere."""
        raise NotImplementedError
    def reset(self, env_ids: Optional[torch.Tensor] = None) -> None:
        """Reset all envs if env_ids is None else only subset env_ids (1D int tensor)."""
        raise NotImplementedError
 # --------------------------
 # Robot Facade (Batched) - YOU wire to IK/hand control
 # --------------------------
@dataclass
 class MoveResultBatched:
    reached: MaskT  # (N,) bool
 class RobotFacadeBatched:
    """
    Replace internals with your actual IsaacLab controllers.
    This interface is batched: everything operates on all envs, masked by active_mask.
    """
    def __init__(self, env: BatchedEnvAPI):
        self.env = env
        self.device = env.device
        self.N = env.num_envs
        # TODO: create & store your DifferentialIKController / hand joint controllers here
        # self.ik = DifferentialIKController(...)
        # self.hand = ...
    def get_ee_pose_w(self) -> tuple[Vec3T, QuatT]:
        """Return EE pose (N,3),(N,4)."""
        raise NotImplementedError
    def is_grasped(self, object_name: str) -> MaskT:
        """Return (N,) grasp status. Implement using contact sensors + relative pose."""
        raise NotImplementedError
    def move_ee_pose(
        self,
        pos_w: Vec3T,
        quat_w: QuatT,
        active_mask: Optional[MaskT] = None,
        pos_tol: float = 0.01,
        rot_tol: float = 0.2,
    ) -> MoveResultBatched:
        """
        Move EE toward target pose for envs in active_mask.
        Return reached mask for ALL envs; unreachable envs should be False.
        """
        if active_mask is None:
            active_mask = torch.ones(self.N, device=self.device, dtype=torch.bool)
        # TODO: implement your IK step here:
        # - compute joint targets for active envs
        # - write into controllers / action buffer
        # - evaluate reached: compare current ee pose vs target
        # Placeholder: pretend reached immediately for active envs
        reached = torch.zeros(self.N, device=self.device, dtype=torch.bool)
        reached[active_mask] = True
        return MoveResultBatched(reached=reached)
    def open_hand(self, active_mask: Optional[MaskT] = None) -> None:
        if active_mask is None:
            active_mask = torch.ones(self.N, device=self.device, dtype=torch.bool)
        # TODO: set finger joint targets open for active envs
        return
    def close_hand(self, active_mask: Optional[MaskT] = None) -> None:
        if active_mask is None:
            active_mask = torch.ones(self.N, device=self.device, dtype=torch.bool)
        # TODO: set finger joint targets close for active envs
        return
    def push_along_axis(
        self,
        start_pos_w: Vec3T,
        quat_w: QuatT,
        axis_w: Vec3T,
        dist: float,
        active_mask: Optional[MaskT] = None,
        pos_tol: float = 0.01,
        rot_tol: float = 0.2,
    ) -> MoveResultBatched:
        """Target = start + axis*dist."""
        target = start_pos_w + axis_w * dist
        return self.move_ee_pose(target, quat_w, active_mask=active_mask, pos_tol=pos_tol, rot_tol=rot_tol)
 # --------------------------
 # Success Evaluator (Batched)
 # --------------------------
 class SuccessEvaluatorBatched:
    def __init__(self, env: BatchedEnvAPI, robot: RobotFacadeBatched, predicates: List[PredicateSpec]):
        self.env = env
        self.robot = robot
        self.predicates = predicates
        self.device = env.device
        self.N = env.num_envs
    def check(self) -> MaskT:
        """Return success mask (N,)."""
        if len(self.predicates) == 0:
            return torch.zeros(self.N, device=self.device, dtype=torch.bool)
        ok = torch.ones(self.N, device=self.device, dtype=torch.bool)
        for p in self.predicates:
            ok = ok & self._eval(p)
        return ok
    def _eval(self, p: PredicateSpec) -> MaskT:
        t = p.type
        a = p.args
        if t == "is_grasped":
            return self.robot.is_grasped(a["object"])
        if t == "object_in_fixture":
            return self.env.contains(a["fixture"], a["object"])
        if t == "object_in_container":
            return self.env.contains(a["container"], a["object"])
        if t == "fixture_state":
            cur = self.env.fixture_state(a["fixture"], a["state_name"])
            # common: cur is bool tensor
            if torch.is_tensor(cur):
                return cur == torch.tensor(a["value"], device=cur.device, dtype=cur.dtype)
            # if not tensor, you can adapt here
            raise TypeError("fixture_state must return a tensor for batched evaluator")
        if t == "button_pressed":
            return self.env.button_pressed(a["fixture"], a["button"])
        if t == "switch_state":
            cur = self.env.switch_state(a["fixture"], a["switch"])
            if torch.is_tensor(cur):
                # value might be str -> you need mapping; keep it tensor-based in env
                return cur == torch.tensor(a["value"], device=cur.device, dtype=cur.dtype)
            raise TypeError("switch_state must return a tensor for batched evaluator")
        if t == "pose_in_tolerance":
            pos, _ = self.env.get_pose_w(a["object"])
            tgt_pos, _ = self.env.get_pose_w(a["target_frame"])
            pos_tol = float(a.get("pos_tol", 0.02))
            d = torch.linalg.norm(pos - tgt_pos, dim=-1)
            return d <= pos_tol
        if t == "depth_in_range":
            obj_pos, _ = self.env.get_pose_w(a["object"])
            hole_pos, _ = self.env.get_pose_w(a["fixture"])
            axis = a.get("axis_w", [0.0, 0.0, 1.0])
            axis_w = torch.tensor(axis, device=self.device, dtype=obj_pos.dtype).view(1, 3).repeat(self.N, 1)
            depth = torch.sum((obj_pos - hole_pos) * axis_w, dim=-1)
            return (depth >= float(a["min_depth"])) & (depth <= float(a["max_depth"]))
        # optional ones not implemented here:
        if t in ("object_on_surface", "thread_engaged"):
            return torch.zeros(self.N, device=self.device, dtype=torch.bool)
        raise ValueError(f"Unknown predicate type: {t}")
 # --------------------------
 # Batched Skills
 #   - Each skill keeps per-env internal phase/timers as tensors.
 #   - step(active_mask) returns done_mask for ALL envs (True only for envs that finished this skill).
 # --------------------------
@dataclass
 class SkillContext:
    env: BatchedEnvAPI
    robot: RobotFacadeBatched
 class BaseSkillBatched:
    def __init__(self, ctx: SkillContext):
        self.ctx = ctx
        self.device = ctx.env.device
        self.N = ctx.env.num_envs
        self.phase = torch.zeros(self.N, device=self.device, dtype=torch.long)  # per-env phase
    def reset(self, enter_mask: MaskT) -> None:
        """Called when some envs enter this skill (idx changes to this skill)."""
        self.phase[enter_mask] = 0
    def step(self, active_mask: MaskT) -> MaskT:
        raise NotImplementedError
 class PickSkillBatched(BaseSkillBatched):
    def __init__(self, ctx: SkillContext, object_name: str, pregrasp_z: float = 0.08):
        super().__init__(ctx)
        self.object_name = object_name
        self.pregrasp_z = pregrasp_z
    def step(self, active_mask: MaskT) -> MaskT:
        done = torch.zeros(self.N, device=self.device, dtype=torch.bool)
        # phase 0: move to pregrasp
        m0 = active_mask & (self.phase == 0)
        if m0.any():
            obj_pos, obj_quat = self.ctx.env.get_pose_w(self.object_name)
            target_pos = obj_pos.clone()
            target_pos[m0, 2] = obj_pos[m0, 2] + self.pregrasp_z
            r = self.ctx.robot.move_ee_pose(target_pos, obj_quat, active_mask=m0)
            reached = r.reached & m0
            self.phase[reached] = 1
        # phase 1: close hand (one-shot)
        m1 = active_mask & (self.phase == 1)
        if m1.any():
            self.ctx.robot.close_hand(active_mask=m1)
            self.phase[m1] = 2
        # phase 2: verify
        m2 = active_mask & (self.phase == 2)
        if m2.any():
            grasped = self.ctx.robot.is_grasped(self.object_name) & m2
            done[grasped] = True
            # keep phase=2 for those not yet grasped (could add timeout logic)
        return done
 class ReleaseSkillBatched(BaseSkillBatched):
    def __init__(self, ctx: SkillContext, object_name: str):
        super().__init__(ctx)
        self.object_name = object_name
    def step(self, active_mask: MaskT) -> MaskT:
        done = torch.zeros(self.N, device=self.device, dtype=torch.bool)
        m0 = active_mask & (self.phase == 0)
        if m0.any():
            self.ctx.robot.open_hand(active_mask=m0)
            self.phase[m0] = 1
        # immediate done (optionally verify not grasped)
        m1 = active_mask & (self.phase == 1)
        done[m1] = True
        return done
 class PlaceSkillBatched(BaseSkillBatched):
    def __init__(self, ctx: SkillContext, object_name: str, target_name: str, above_z: float = 0.10):
        super().__init__(ctx)
        self.object_name = object_name
        self.target_name = target_name
        self.above_z = above_z
    def step(self, active_mask: MaskT) -> MaskT:
        done = torch.zeros(self.N, device=self.device, dtype=torch.bool)
        # phase 0: move above target
        m0 = active_mask & (self.phase == 0)
        if m0.any():
            tgt_pos, tgt_quat = self.ctx.env.get_pose_w(self.target_name)
            above = tgt_pos.clone()
            above[m0, 2] = tgt_pos[m0, 2] + self.above_z
            r = self.ctx.robot.move_ee_pose(above, tgt_quat, active_mask=m0)
            reached = r.reached & m0
            self.phase[reached] = 1
        # phase 1: move down to target
        m1 = active_mask & (self.phase == 1)
        if m1.any():
            tgt_pos, tgt_quat = self.ctx.env.get_pose_w(self.target_name)
            r = self.ctx.robot.move_ee_pose(tgt_pos, tgt_quat, active_mask=m1)
            reached = r.reached & m1
            self.phase[reached] = 2
        # phase 2: open hand then done
        m2 = active_mask & (self.phase == 2)
        if m2.any():
            self.ctx.robot.open_hand(active_mask=m2)
            done[m2] = True
        return done
 class AlignSkillBatched(BaseSkillBatched):
    """
    Placeholder alignment: go to pre-insert pose above fixture frame.
    Replace internally with your pinch-axis + face selection + micro-adjust.
    """
    def __init__(self, ctx: SkillContext, object_name: str, target_fixture: str, standoff_z: float = 0.06):
        super().__init__(ctx)
        self.object_name = object_name
        self.target_fixture = target_fixture
        self.standoff_z = standoff_z
    def step(self, active_mask: MaskT) -> MaskT:
        done = torch.zeros(self.N, device=self.device, dtype=torch.bool)
        m0 = active_mask & (self.phase == 0)
        if m0.any():
            hole_pos, hole_quat = self.ctx.env.get_pose_w(self.target_fixture)
            pre = hole_pos.clone()
            pre[m0, 2] = hole_pos[m0, 2] + self.standoff_z
            r = self.ctx.robot.move_ee_pose(pre, hole_quat, active_mask=m0)
            reached = r.reached & m0
            done[reached] = True
        return done
 class InsertSkillBatched(BaseSkillBatched):
    """
    Placeholder insertion: move to pre, then push along -Z.
    Replace axis with fixture insertion axis, and add contact-based micro-adjust.
    """
    def __init__(self, ctx: SkillContext, object_name: str, target_fixture: str, pre_z: float = 0.03, depth: float = 0.02):
        super().__init__(ctx)
        self.object_name = object_name
        self.target_fixture = target_fixture
        self.pre_z = pre_z
        self.depth = depth
    def step(self, active_mask: MaskT) -> MaskT:
        done = torch.zeros(self.N, device=self.device, dtype=torch.bool)
        # phase 0: pre-insert
        m0 = active_mask & (self.phase == 0)
        if m0.any():
            hole_pos, hole_quat = self.ctx.env.get_pose_w(self.target_fixture)
            pre = hole_pos.clone()
            pre[m0, 2] = hole_pos[m0, 2] + self.pre_z
            r = self.ctx.robot.move_ee_pose(pre, hole_quat, active_mask=m0)
            reached = r.reached & m0
            self.phase[reached] = 1
        # phase 1: push along axis
        m1 = active_mask & (self.phase == 1)
        if m1.any():
            hole_pos, hole_quat = self.ctx.env.get_pose_w(self.target_fixture)
            start = hole_pos.clone()
            start[m1, 2] = hole_pos[m1, 2] + self.pre_z
            axis_w = torch.zeros((self.N, 3), device=self.device, dtype=hole_pos.dtype)
            axis_w[:, 2] = -1.0
            r = self.ctx.robot.push_along_axis(start, hole_quat, axis_w, self.depth, active_mask=m1)
            reached = r.reached & m1
            done[reached] = True
        return done
 # --------------------------
 # Skill Factory (Batched)
 # --------------------------
 def build_skill_batched(ctx: SkillContext, spec: SkillSpec) -> BaseSkillBatched:
    n = spec.name
    a = spec.args
    if n == "pick":
        return PickSkillBatched(ctx, a["object"])
    if n == "release":
        return ReleaseSkillBatched(ctx, a["object"])
    if n == "place":
        return PlaceSkillBatched(ctx, a["object"], a["target"])
    if n == "align":
        return AlignSkillBatched(ctx, a["object"], a["target_fixture"])
    if n == "insert":
        depth = float(a.get("depth", 0.02))
        return InsertSkillBatched(ctx, a["object"], a["target_fixture"], depth=depth)
    raise NotImplementedError(f"Skill not implemented (batched): {n}")
 # --------------------------
 # Batched Skill FSM
 # --------------------------
 class SkillFSMBatched:
    """
    One task_spec replicated across N envs.
    Maintain env-wise idx; execute appropriate skill for env subsets.
    """
    def __init__(self, ctx: SkillContext, skill_specs: List[SkillSpec]):
        self.ctx = ctx
        self.device = ctx.env.device
        self.N = ctx.env.num_envs
        self.skill_specs = skill_specs
        self.K = len(skill_specs)
        # Prebuild all skill objects (K of them), each with per-env phase tensor
        self.skills: List[BaseSkillBatched] = [build_skill_batched(ctx, s) for s in skill_specs]
        # env-wise pointer
        self.idx = torch.zeros(self.N, device=self.device, dtype=torch.long)  # current skill index per env
        self.done = torch.zeros(self.N, device=self.device, dtype=torch.bool)  # whether sequence finished
    def reset(self, env_ids: Optional[torch.Tensor] = None) -> None:
        """Reset FSM for all envs or subset."""
        if env_ids is None:
            mask = torch.ones(self.N, device=self.device, dtype=torch.bool)
        else:
            mask = torch.zeros(self.N, device=self.device, dtype=torch.bool)
            mask[env_ids] = True
        self.idx[mask] = 0
        self.done[mask] = False
        # envs enter skill 0
        self.skills[0].reset(mask)
    def step(self, active_mask: MaskT) -> MaskT:
        """
        Advance one tick for envs in active_mask.
        Returns seq_done_mask (N,) indicating which envs have finished all skills.
        """
        # Don't run already finished envs
        run_mask = active_mask & (~self.done)
        if not run_mask.any():
            return self.done.clone()
        # For each skill k, run for envs where idx==k
        for k in range(self.K):
            mk = run_mask & (self.idx == k)
            if not mk.any():
                continue
            skill_done = self.skills[k].step(mk)  # returns (N,)
            finished_here = mk & skill_done
            if finished_here.any():
                # advance idx
                next_idx = k + 1
                if next_idx >= self.K:
                    # sequence finished
                    self.done[finished_here] = True
                else:
                    self.idx[finished_here] = next_idx
                    # envs "enter" next skill => reset its internal phase for these envs
                    self.skills[next_idx].reset(finished_here)
        return self.done.clone()
 # --------------------------
 # Compiled Task Bundle (Batched)
 # --------------------------
@dataclass
 class CompiledTaskBatched:
    env: BatchedEnvAPI
    robot: RobotFacadeBatched
    fsm: SkillFSMBatched
    evaluator: SuccessEvaluatorBatched
 # --------------------------
 # Compiler (Batched)
 # --------------------------
 class LLMFSMCompilerBatched:
    def compile(self, env: BatchedEnvAPI, task_spec: TaskSpec) -> CompiledTaskBatched:
        robot = RobotFacadeBatched(env)
        ctx = SkillContext(env=env, robot=robot)
        fsm = SkillFSMBatched(ctx, task_spec.skills)
        evaluator = SuccessEvaluatorBatched(env, robot, task_spec.goal.success_conditions)
        # full reset
        fsm.reset()
        return CompiledTaskBatched(env=env, robot=robot, fsm=fsm, evaluator=evaluator)
 # --------------------------
 # Runner loop (multi-env)
 # --------------------------
 def run_compiled_task_multi_env(
    compiled: CompiledTaskBatched,
    max_steps: int = 2000,
    auto_reset_success: bool = False,
 ) -> Dict[str, Any]:
    env = compiled.env
    N = env.num_envs
    device = env.device
    # initial reset
    env.reset()
    compiled.fsm.reset()
    success = torch.zeros(N, device=device, dtype=torch.bool)
    for t in range(max_steps):
        # 1) check success before step (optional)
        success_now = compiled.evaluator.check()
        success = success | success_now
        # 2) active envs = not success and not fsm-done (you can choose policy)
        active = (~success) & (~compiled.fsm.done)
        # 3) advance FSM for active envs
        compiled.fsm.step(active)
        # 4) physics step
        env.step_physics(action=None)
        # 5) optional: auto-reset envs that succeeded (common for dataset generation)
        if auto_reset_success and success_now.any():
            env_ids = torch.nonzero(success_now, as_tuple=False).squeeze(-1)
            env.reset(env_ids)
            compiled.fsm.reset(env_ids)
            success[env_ids] = False  # start new episode for those envs
        # early stop: all envs succeeded or finished
        if ((success | compiled.fsm.done).all()):
            break
    return {
        "success_mask": success.detach().clone(),
        "fsm_done_mask": compiled.fsm.done.detach().clone(),
        "steps": t + 1,
    }
 # --------------------------
 # Example: constructing TaskSpec (no JSON parser here)
 # --------------------------
 def make_example_task_spec() -> TaskSpec:
    skills = [
        SkillSpec("pick", {"object": "peg_small"}),
        SkillSpec("align", {"object": "peg_small", "target_fixture": "alignment_jig_hole"}),
        SkillSpec("insert", {"object": "peg_small", "target_fixture": "alignment_jig_hole", "depth": 0.02}),
        SkillSpec("release", {"object": "peg_small"}),
    ]
    preds = [
        PredicateSpec("object_in_fixture", {"object": "peg_small", "fixture": "alignment_jig_hole"}),
        PredicateSpec("depth_in_range", {"object": "peg_small", "fixture": "alignment_jig_hole", "min_depth": 0.018, "max_depth": 0.022, "axis_w": [0, 0, 1]}),
    ]
    return TaskSpec(
        task_id="peg_seat_001",
        activity="Peg Alignment & Seating",
        task_name="Insert Small Peg into Alignment Jig",
        skills=skills,
        goal=GoalSpec(summary="Insert peg into jig", success_conditions=preds),
    )
--- a/llm_task_generator.py
+++ b/llm_task_generator.py
@ -0,0 +1,246 @@
 # llm_task_generator_activity.py
 from __future__ import annotations
 import os
 import json
 from typing import Any, Dict, List, Optional
 from openai import OpenAI
 # -----------------------------
 # OpenAI client / model
 # -----------------------------
 def _get_openai_client() -> "OpenAI":
    if OpenAI is None:
        raise RuntimeError(
            "Python package `openai` is not installed. Install it (e.g. `pip install openai`) "
            "to use generate_task_spec_from_activity()."
        )
    return OpenAI(api_key=os.environ.get("OPENAI_API_KEY"))
 MODEL_NAME = "gpt-4.1-mini"   # 필요 시 "gpt-4.1"로 변경
 # -----------------------------
 # Output contract (TaskSpec JSON)
 # -----------------------------
 TASK_SCHEMA_DESCRIPTION = """
 Output JSON ONLY (no markdown, no comments), with this exact structure:
 {
  "task_id": string,
  "activity": string,
  "task_name": string,
  "skills": [
    { "name": string, "args": object }
  ],
  "goal": {
    "summary": string,
    "success_conditions": [
      { "type": string, ...predicate args... }
    ]
  }
 }
 Rules:
 - Use only allowed objects/fixtures/containers/tools provided.
 - Use only allowed skills provided.
 - Use only allowed goal predicates provided.
 - Steps must be between min_steps and max_steps (inclusive).
 - Do NOT output coordinates, poses, or any continuous control targets.
 - Ensure preconditions: pick(object) must occur before place/align/insert/release for that object.
 - Skill args must use the EXACT keys specified in the "Skill argument schema" section of the prompt.
 """
 DEFAULT_ALLOWED_SKILLS = [
    "pick", "release", "place",
    "align", "insert",
 ]
 DEFAULT_ALLOWED_PREDICATES = [
    "is_grasped",
    "object_in_fixture",
    "object_in_container",
    "pose_in_tolerance",
    "depth_in_range",
    "fixture_state",
    "button_pressed",
    "switch_state",
    "thread_engaged",
 ]
 SKILL_ARG_SCHEMA: Dict[str, Dict[str, List[str]]] = {
    "pick": {"required": ["object"], "optional": []},
    "release": {"required": ["object"], "optional": []},
    "place": {"required": ["object", "target"], "optional": []},
    "align": {"required": ["object", "target_fixture"], "optional": []},
    "insert": {"required": ["object", "target_fixture"], "optional": ["depth"]},
 }
 def _format_skill_arg_schema(allowed_skills: List[str]) -> str:
    lines: List[str] = []
    for skill_name in allowed_skills:
        spec = SKILL_ARG_SCHEMA.get(skill_name)
        if spec is None:
            continue
        req = ", ".join(spec["required"]) if spec["required"] else "(none)"
        opt = ", ".join(spec["optional"]) if spec["optional"] else "(none)"
        lines.append(f'- {skill_name}: required args = [{req}], optional args = [{opt}]')
    if not lines:
        return "- (no schema available)"
    return "\n".join(lines)
 def _normalize_task_spec(task: Dict[str, Any]) -> Dict[str, Any]:
    skills = task.get("skills", [])
    if not isinstance(skills, list):
        return task
    for s in skills:
        if not isinstance(s, dict):
            continue
        name = s.get("name")
        args = s.get("args", {})
        if not isinstance(args, dict):
            args = {}
        if name in ("align", "insert"):
            if "target_fixture" not in args and "fixture" in args:
                args["target_fixture"] = args.pop("fixture")
        if name == "place":
            if "target" not in args and "fixture" in args:
                args["target"] = args.pop("fixture")
        s["args"] = args
    return task
 def _build_task_prompt_from_activity(
    activity_key: str,
    activity_def: Dict[str, Any],
    *,
    allowed_skills: List[str],
    allowed_predicates: List[str],
    min_steps: int,
    max_steps: int,
 ) -> str:
    desc = activity_def.get("description", "")
    objs = activity_def.get("allowed_objects", [])
    fxs = activity_def.get("allowed_fixtures", [])
    containers = activity_def.get("allowed_containers", [])
    tools = activity_def.get("allowed_tools", [])
    tags = activity_def.get("difficulty_tags", [])
    # activity-specific overrides are allowed
    activity_skills = activity_def.get("allowed_skills", allowed_skills)
    activity_preds = activity_def.get("allowed_predicates", allowed_predicates)
    return f"""
 You are generating a robotics task specification for a WORKBENCH dexterous manipulation setup.
 SELECTED ACTIVITY KEY: {activity_key}
 Activity description: {desc}
 Difficulty tags: {tags}
 Allowed entities:
 - objects: {objs}
 - fixtures: {fxs}
 - containers: {containers}
 - tools: {tools}
 Allowed skills (use EXACT names):
 {activity_skills}
 Allowed goal predicates (use EXACT names):
 {activity_preds}
 Skill argument schema (MUST follow EXACT arg keys):
 {_format_skill_arg_schema(activity_skills)}
 Hard constraints:
 - Output JSON only.
 - Do not invent new entities (must be from allowed lists).
 - Do not invent new skills/predicates.
 - Steps must be between {min_steps} and {max_steps}.
 - Must satisfy skill preconditions:
  * pick(object) must happen before align/insert/place/release for that object
  * release(object) should only happen after object was picked
 - No coordinates, no poses, no numeric target positions in skills.
 {TASK_SCHEMA_DESCRIPTION}
 Now generate ONE task JSON. Make it unique, concrete, and feasible for the selected activity.
 """
 def _parse_json_strict(text: str) -> Dict[str, Any]:
    text = text.strip()
    # minimal cleanup for cases with accidental code fences
    if text.startswith("```"):
        text = text.strip("`")
        # try to remove language hint
        lines = text.splitlines()
        if lines and lines[0].lower().startswith("json"):
            text = "\n".join(lines[1:])
    try:
        return json.loads(text)
    except json.JSONDecodeError as e:
        raise RuntimeError(f"LLM output was not valid JSON.\n---\n{text}\n---") from e
 def generate_task_spec_from_activity(
    activity_key: str,
    activity_def: Dict[str, Any],
    *,
    model: str = MODEL_NAME,
    temperature: float = 0.2,
    max_output_tokens: int = 900,
    min_steps: int = 5,
    max_steps: int = 10,
    allowed_skills: Optional[List[str]] = None,
    allowed_predicates: Optional[List[str]] = None,
 ) -> Dict[str, Any]:
    """
    Generate ONE TaskSpec JSON dict for a pre-defined activity.
    Returns a dict like:
      { task_id, activity, task_name, skills:[...], goal:{summary, success_conditions:[...]} }
    """
    if allowed_skills is None:
        allowed_skills = DEFAULT_ALLOWED_SKILLS
    if allowed_predicates is None:
        allowed_predicates = DEFAULT_ALLOWED_PREDICATES
    prompt = _build_task_prompt_from_activity(
        activity_key,
        activity_def,
        allowed_skills=allowed_skills,
        allowed_predicates=allowed_predicates,
        min_steps=min_steps,
        max_steps=max_steps,
    )
    client = _get_openai_client()
    resp = client.responses.create(
        model=model,
        input=[
            {"role": "system", "content": "You output strictly valid JSON task specs for robotics. No extra text."},
            {"role": "user", "content": prompt},
        ],
        temperature=temperature,
        max_output_tokens=max_output_tokens,
    )
    task = _parse_json_strict(resp.output_text)
    task = _normalize_task_spec(task)
    # Ensure activity field matches selected activity_key (stability)
    task["activity"] = activity_key
    if "task_id" not in task or not task["task_id"]:
        task["task_id"] = f"{activity_key}_auto_0001"
    if "task_name" not in task or not task["task_name"]:
        task["task_name"] = task["task_id"]
    return task
--- a/llm_task_validator.py
+++ b/llm_task_validator.py
@ -0,0 +1,37 @@
 from typing import Dict, Any
 ALLOWED_SKILLS = {
    "pick": ["object"],
    "align": ["object", "target_fixture"],
    "insert": ["object", "target_fixture"],
    "release": ["object"],
 }
 ALLOWED_PREDICATES = {
    "object_in_fixture",
    "depth_in_range",
    "pose_in_tolerance",
 }
 def validate_task_spec(task: Dict[str, Any]) -> None:
    assert "skills" in task
    assert "goal" in task
    # ---- skills ----
    for s in task["skills"]:
        name = s["name"]
        args = s.get("args", {})
        if name not in ALLOWED_SKILLS:
            raise ValueError(f"Unknown skill: {name}")
        required_args = ALLOWED_SKILLS[name]
        for k in required_args:
            if k not in args:
                raise ValueError(f"Skill {name} missing arg: {k}")
    # ---- predicates ----
    for p in task["goal"]["success_conditions"]:
        if p["type"] not in ALLOWED_PREDICATES:
            raise ValueError(f"Unknown predicate: {p['type']}")
--- a/run.py
+++ b/run.py
@ -0,0 +1,65 @@
 import argparse
 import random
 from pathlib import Path
 from dotenv_loader import load_dotenv_into_environ
 from task_activities import WORKBENCH_ACTIVITIES
 # --------------------------------
 # Example workflow
 # --------------------------------
 def main():
    parser = argparse.ArgumentParser()
    parser.add_argument(
        "activity",
        nargs="?",
        help="Activity key to run (defaults to random).",
    )
    args = parser.parse_args()
    # Load `.env` from this folder into `os.environ` before importing OpenAI client code.
    load_dotenv_into_environ(Path(__file__).resolve().parent / ".env", override=False)
    from llm_task_generator import generate_task_spec_from_activity
    from llm_task_validator import ALLOWED_PREDICATES, ALLOWED_SKILLS, validate_task_spec
    from llm_fsm_multi_env import (
        TaskSpec,
        LLMFSMCompilerBatched,
        run_compiled_task_multi_env,
    )
    # 1) select activity
    if args.activity is not None:
        if args.activity not in WORKBENCH_ACTIVITIES:
            available = ", ".join(sorted(WORKBENCH_ACTIVITIES.keys()))
            raise SystemExit(f"Unknown activity `{args.activity}`. Available: {available}")
        activity_key = args.activity
    else:
        activity_key = random.choice(list(WORKBENCH_ACTIVITIES.keys()))
    activity_def = WORKBENCH_ACTIVITIES[activity_key]
    # 2) generate task under this activity
    task_dict = generate_task_spec_from_activity(
        activity_key,
        activity_def,
        allowed_skills=list(ALLOWED_SKILLS.keys()),
        allowed_predicates=sorted(ALLOWED_PREDICATES),
    )
    validate_task_spec(task_dict)
    # 3) convert dict → TaskSpec dataclass
    task_spec = TaskSpec.from_dict(task_dict)
    # 4) compile & run
    compiler = LLMFSMCompilerBatched()
    compiled = compiler.compile(env=batched_env, task_spec=task_spec)
    # result = run_compiled_task_multi_env(compiled)
    # print("Result:", result)
 if __name__ == "__main__":
    main()
--- a/task_activities.py
+++ b/task_activities.py
@ -0,0 +1,35 @@
 from __future__ import annotations
 # activities.py
 WORKBENCH_ACTIVITIES = {
    "peg_alignment": {
        "description": "Aligning and inserting pegs into fixed jigs or holes.",
        "allowed_objects": ["peg_small", "peg_large"],
        "allowed_fixtures": ["alignment_jig_hole"],
        "difficulty_tags": ["alignment", "insertion"],
    },
    "loose_fastening": {
        "description": "Loosely fastening bolts into nut plates without full tightening.",
        "allowed_objects": ["bolt_m3"],
        "allowed_fixtures": ["nut_plate_hole"],
        "difficulty_tags": ["threading", "rotation"],
    },
    "key_lock_rotation": {
        "description": "Inserting a key and rotating it until a mechanical stop.",
        "allowed_objects": ["flat_key"],
        "allowed_fixtures": ["lock_slot"],
        "difficulty_tags": ["insertion", "limited_rotation"],
    },
    "drawer_interaction": {
        "description": "Opening drawers and moving parts in or out.",
        "allowed_objects": ["small_gear"],
        "allowed_fixtures": ["drawer"],
        "difficulty_tags": ["fixture", "occlusion"],
    },
 }