feat: random with boundary

feat: random explore
2024-04-29 02:39:46 +08:00 · 2024-04-29 02:19:06 +08:00
4 changed files with 114 additions and 7 deletions
--- a/nav_src/NavGPT.py
+++ b/nav_src/NavGPT.py
@ -8,7 +8,7 @@ from utils.logger import write_to_record_file
 from utils.data import ImageObservationsDB
 from parser import parse_args
 from env import REVERIENavBatch
-from agent import NavGPTAgent
+from agent import NavGPTAgent, RandomAgent

 def build_dataset(args, data_limit=100):

@ -35,7 +35,7 @@ def build_dataset(args, data_limit=100):

 def valid(args, val_envs):

-    agent = NavGPTAgent(next(iter(val_envs.values())), args)
+    agent = RandomAgent(next(iter(val_envs.values())), args)

    with open(os.path.join(args.log_dir, 'validation_args.json'), 'w') as outf:
        json.dump(vars(args), outf, indent=4)
--- a/nav_src/agent.py
+++ b/nav_src/agent.py
@ -5,6 +5,7 @@ import re
 import warnings
 import numpy as np
 from typing import Any, Callable, List, NamedTuple, Optional, Sequence, Tuple, Dict, Union
+import random

 from env import REVERIENavBatch
 from argparse import Namespace
@ -817,3 +818,113 @@ class NavGPTAgent(BaseAgent):

        return self.traj

+class RandomAgent(BaseAgent):
+    def __init__(
+            self, 
+            env: REVERIENavBatch, 
+            config: Namespace):
+        """
+        Initialize the LLM Navigation Agent.
+
+        Args:
+            env: The Matterport3D environment.
+            config: The configuration.
+        """
+        super().__init__(env)
+        self.config = config
+
+
+    def init_trajecotry(self, obs: List[dict]):
+        """Initialize the trajectory with the given observation."""
+        # Record the navigation path
+        self.traj = [{
+            'instr_id': ob['instr_id'],
+            'path': [[ob['start']]],
+            'details': [],
+        } for ob in obs]
+        # Record the history of actions taken
+
+
+    def make_equiv_action(self, actions: List[str]) -> str:
+        """
+        Interface between Panoramic view and Egocentric view
+        Take in the next viewpoint ID and move the agent to that viewpoint
+        return the turned angle and new observation
+        """
+        def normalize_angle(angle):
+            while angle > 180:
+                angle -= 360
+            while angle <= -180:
+                angle += 360
+            return angle
+
+        def angle_to_left_right(angle):
+            return f"left {-angle:.2f}" if angle < 0 else f"right {angle:.2f}"
+        
+        # Get current agent facing angle
+        cur_obs = self.env._get_obs()[0]
+        cur_heading = np.rad2deg(cur_obs['heading'])
+        # Make the action
+        new_obs = self.env.step(actions)[0]
+        new_heading = np.rad2deg(new_obs['heading'])
+        # Record the trajectory
+        self.traj[0]['path'].append(self.env.env.sims[0].gmap.bfs_shortest_path(cur_obs['viewpoint'], actions[0])[1:])
+        # Calculate the turned angle
+        turned_angle = new_heading - cur_heading
+        # Generate action description
+        cur_heading = angle_to_left_right(normalize_angle(cur_heading))
+        new_heading = angle_to_left_right(normalize_angle(new_heading))
+        action_description = f'Turn heading direction {turned_angle:.2f} degrees from {cur_heading} to {new_heading}.'
+        return action_description, new_obs
+
+    def rollout(self, reset=True):
+        if reset:  # Reset env
+            obs = self.env.reset()
+        else:
+            obs = self.env._get_obs()
+
+        global FINAL_STOP_POINT
+        global TEMP_STEPS_COUNTER
+        global STEPS_COUNTER
+        global SUCCESS
+
+        FINAL_STOP_POINT = obs[0]['stop']
+
+        if TEMP_STEPS_COUNTER != 0:
+            TEMP_STEPS_COUNTER = 0
+
+        print("=="*20)
+
+        # Initialize the trajectory
+        self.init_trajecotry(obs)
+
+        for iteration in range(self.config.max_iterations):
+            next_point = None
+            print(obs[0].keys())
+            print(obs[0]['viewpoint'])
+            for i, init_ob in enumerate(obs):
+                navigable = [ k for k, v in init_ob['candidate'].items() ]
+                next_point = random.choice(navigable)
+                print(next_point)
+                turned_angle, obs = self.make_equiv_action([next_point])
+                obs = [obs]
+
+                print(f"TEMP_STEPS_COUNTER={TEMP_STEPS_COUNTER}")
+                print(f"STEPS_COUNTER={STEPS_COUNTER}")
+                TEMP_STEPS_COUNTER += 1
+
+            if next_point == FINAL_STOP_POINT:
+                print("    SUCCESS")
+                STEPS_COUNTER += TEMP_STEPS_COUNTER
+                SUCCESS += 1
+                TEMP_STEPS_COUNTER = 0
+                break
+        
+        print(f"FINAL_STOP_POINT={FINAL_STOP_POINT}")
+        print(f"SUCCESS={SUCCESS}")
+        print(f"TEMP_STEPS_COUNTER={TEMP_STEPS_COUNTER}")
+        print(f"STEPS_COUNTER={STEPS_COUNTER}")
+
+
+
+        return self.traj
--- a/nav_src/agent_base.py
+++ b/nav_src/agent_base.py
@ -14,10 +14,6 @@ class BaseAgent(object):
            output.append({'instr_id': k, 'trajectory': v['path']})
            if detailed_output:
                output[-1]['details'] = v['details']
-                output[-1]['action_plan'] = v['action_plan']
-                output[-1]['llm_output'] = v['llm_output']
-                output[-1]['llm_thought'] = v['llm_thought']
-                output[-1]['llm_observation'] = v['llm_observation']
        return output

    def rollout(self, **args):
--- a/nav_src/env.py
+++ b/nav_src/env.py
@ -136,7 +136,6 @@ class Simulator(object):

        self.node_region, self.region_room, self.region_obj, self.node_locations = load_floorplan()

-
    def newEpisode(
            self, 
            scan_ID: str, 
@ -171,6 +170,7 @@ class Simulator(object):
                print(start_region, to_region)
            print("AFTER: ", len(self.navigable_dict[start]))

+
        # Get candidate
        self.getCandidate()
Author	SHA1	Message	Date
Ting-Jun Wang	32ceca7752	feat: random with boundary	2024-04-29 02:39:46 +08:00
Ting-Jun Wang	5848e22b1e	feat: random explore	2024-04-29 02:19:06 +08:00