From 8d40d43c5a47896ddf91dcef9dc75a1939d0b4b0 Mon Sep 17 00:00:00 2001
From: Caiyishuai <39987654+Caiyishuai@users.noreply.github.com>
Date: Thu, 16 Nov 2023 17:57:27 +0800
Subject: [PATCH] =?UTF-8?q?=E5=A2=9E=E5=8A=A0=20VLM=20=E5=9C=BA=E6=99=AF?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 robowaiter/behavior_lib/_base/Behavior.py     |   2 +
 robowaiter/behavior_lib/act/Make.py           |   2 +-
 robowaiter/behavior_lib/act/MoveTo.py         |   6 +-
 robowaiter/behavior_lib/act/PutDown.py        |   4 +
 robowaiter/behavior_lib/cond/On.py            |   3 +
 .../obtea/OptimalBTExpansionAlgorithm.py      |  30 +++--
 .../behavior_tree/obtea/opt_bt_exp_main.py    |   2 +-
 robowaiter/llm_client/data/test_questions.txt |   2 +-
 .../llm_client/data_raw/test_questions.csv    |   2 +-
 robowaiter/llm_client/data_tools/csv2dict.py  |   1 -
 robowaiter/scene/tasks/{ => VLM}/VLM.py       |   5 +-
 robowaiter/scene/tasks/VLM/VLM2.py            | 123 ++++++++++++++++++
 robowaiter/scene/tasks/VLM/__init__.py        |   0
 sub_task.ptml                                 |   7 +-
 14 files changed, 168 insertions(+), 21 deletions(-)
 rename robowaiter/scene/tasks/{ => VLM}/VLM.py (95%)
 create mode 100644 robowaiter/scene/tasks/VLM/VLM2.py
 create mode 100644 robowaiter/scene/tasks/VLM/__init__.py

diff --git a/robowaiter/behavior_lib/_base/Behavior.py b/robowaiter/behavior_lib/_base/Behavior.py
index 1bd0182..78fa48a 100644
--- a/robowaiter/behavior_lib/_base/Behavior.py
+++ b/robowaiter/behavior_lib/_base/Behavior.py
@@ -33,6 +33,8 @@ class Bahavior(ptree.behaviour.Behaviour):
         'Water': 'Glass',
         'Dessert':'Plate'
     }
+
+
     
     @classmethod
     def get_ins_name(cls,*args):
diff --git a/robowaiter/behavior_lib/act/Make.py b/robowaiter/behavior_lib/act/Make.py
index a730820..88f828e 100644
--- a/robowaiter/behavior_lib/act/Make.py
+++ b/robowaiter/behavior_lib/act/Make.py
@@ -57,6 +57,6 @@ class Make(Act):
         self.scene.state["condition_set"] |= (self.info["add"])
         self.scene.state["condition_set"] -= self.info["del_set"]
 
-        print("condition_set:",self.scene.state["condition_set"])
+        # print("condition_set:",self.scene.state["condition_set"])
 
         return Status.RUNNING
\ No newline at end of file
diff --git a/robowaiter/behavior_lib/act/MoveTo.py b/robowaiter/behavior_lib/act/MoveTo.py
index 43cef8b..6c31ad5 100644
--- a/robowaiter/behavior_lib/act/MoveTo.py
+++ b/robowaiter/behavior_lib/act/MoveTo.py
@@ -21,7 +21,7 @@ class MoveTo(Act):
             info['pre'] |= {f'Exist({arg})'}
         info["add"] = {f'At(Robot,{arg})'}
         info["del_set"] = {f'At(Robot,{place})' for place in cls.valid_args if place != arg}
-        info['cost']=5
+        info['cost']=10
         return info
 
 
@@ -53,8 +53,6 @@ class MoveTo(Act):
                     if obj.name == target_name:
                         obj_info = obj_dict[id]
                         dis = self.scene.cal_distance_to_robot(obj_info.location.X, obj_info.location.Y, obj_info.location.Z)
-                        if id==275:
-                            print("275'dis:",dis)
                         if dis<min_dis:
                             min_dis = dis
                             obj_id = id
@@ -64,7 +62,7 @@ class MoveTo(Act):
             if obj_id == -1:
                 return ptree.common.Status.FAILURE
 
-            print("self.target_place:",self.target_place,"id:",obj_id,"dis:",min_dis)
+            # print("self.target_place:",self.target_place,"id:",obj_id,"dis:",min_dis)
             self.scene.move_to_obj(obj_id=obj_id)
 
             # 为了演示，写死咖啡位置
diff --git a/robowaiter/behavior_lib/act/PutDown.py b/robowaiter/behavior_lib/act/PutDown.py
index 6457868..b4e3af0 100644
--- a/robowaiter/behavior_lib/act/PutDown.py
+++ b/robowaiter/behavior_lib/act/PutDown.py
@@ -22,6 +22,8 @@ class PutDown(Act):
         info["pre"] = {f'Holding({arg[0]})',f'At(Robot,{arg[1]})'}
         info["add"] = {f'Holding(Nothing)',f'On({arg[0]},{arg[1]})'}
         info["del_set"] = {f'Holding({arg[0]})'}
+
+        info['cost'] = 100
         return info
 
 
@@ -36,4 +38,6 @@ class PutDown(Act):
 
         self.scene.state["condition_set"] |= (self.info["add"])
         self.scene.state["condition_set"] -= self.info["del_set"]
+
+        print("After PutDown condition_set:",self.scene.state["condition_set"])
         return Status.RUNNING
diff --git a/robowaiter/behavior_lib/cond/On.py b/robowaiter/behavior_lib/cond/On.py
index ea3ff50..0060e2e 100644
--- a/robowaiter/behavior_lib/cond/On.py
+++ b/robowaiter/behavior_lib/cond/On.py
@@ -16,6 +16,9 @@ class On(Cond):
     def _update(self) -> ptree.common.Status:
         # if self.scene.status?
 
+        # print("self.name:",self.name)
+        # print("On: condition_set:",self.scene.state["condition_set"])
+
         if self.name in self.scene.state["condition_set"]:
             return ptree.common.Status.SUCCESS
         else:
diff --git a/robowaiter/behavior_tree/obtea/OptimalBTExpansionAlgorithm.py b/robowaiter/behavior_tree/obtea/OptimalBTExpansionAlgorithm.py
index 6a69783..cf88a21 100644
--- a/robowaiter/behavior_tree/obtea/OptimalBTExpansionAlgorithm.py
+++ b/robowaiter/behavior_tree/obtea/OptimalBTExpansionAlgorithm.py
@@ -105,8 +105,8 @@ class OptBTExpAlgorithm:
                         [copy.deepcopy(pair_node.cond_leaf), copy.deepcopy(pair_node.act_leaf)])
                     subtree.add_child([copy.deepcopy(sequence_structure)])  # subtree æ˜¯å›žä¸æ–­å˜åŒ–çš„ï¼Œå®ƒçš„çˆ¶äº²æ˜¯self.bt
                     # å¢žåŠ å®žæ—¶æ¡ä»¶åˆ¤æ–­ï¼Œæ»¡è¶³æ¡ä»¶å°±ä¸å†æ‰©å±•
-                    if c <= self.scene.state["condition_set"]:
-                        return True
+                    # if c <= self.scene.state["condition_set"]:
+                    #     return True
                 else:
                     subtree.add_child([copy.deepcopy(pair_node.act_leaf)])
 
@@ -138,14 +138,14 @@ class OptBTExpAlgorithm:
                                 break
 
                         if valid:
-                            # æŠŠç¬¦åˆæ¡ä»¶çš„åŠ¨ä½œèŠ‚ç‚¹éƒ½æ”¾åˆ°åˆ—è¡¨é‡Œ
-                            if self.verbose:
-                                print("â€”â€”â€”â€” -- %s ç¬¦åˆæ¡ä»¶æ”¾å…¥åˆ—è¡¨" % actions[i].name)
                             c_attr_node = Leaf(type='cond', content=c_attr, mincost=current_mincost + actions[i].cost)
                             a_attr_node = Leaf(type='act', content=actions[i], mincost=current_mincost + actions[i].cost)
                             cond_anc_pair = CondActPair(cond_leaf=c_attr_node, act_leaf=a_attr_node)
                             self.nodes.append(copy.deepcopy(cond_anc_pair))  # condition node list
                             self.traversed.append(c_attr) # 重点 the set of expanded conditions
+                            # 把符合条件的动作节点都放到列表里
+                            if self.verbose:
+                                print("â€”â€”â€”â€” -- %s ç¬¦åˆæ¡ä»¶æ”¾å…¥åˆ—è¡¨,å¯¹åº”çš„cä¸º %s" % (actions[i].name,c_attr))
 
         if self.verbose:
             print("ç®—æ³•ç»“æŸï¼\n")
@@ -188,13 +188,23 @@ class OptBTExpAlgorithm:
 
 
     # æ ‘çš„dfs
-    def dfs_ptml(self,parnode):
+    def dfs_ptml(self,parnode,is_root=False):
         for child in parnode.children:
             if isinstance(child, Leaf):
                 if child.type == 'cond':
-                    self.ptml_string += "cond "
-                    c_set_str = '\n cond '.join(map(str, child.content)) + "\n"
-                    self.ptml_string += c_set_str
+
+                    if is_root and len(child.content) > 1:
+                        # 把多个 cond 串起来
+                        self.ptml_string += "sequence{\n"
+                        self.ptml_string += "cond "
+                        c_set_str = '\n cond '.join(map(str, child.content)) + "\n"
+                        self.ptml_string += c_set_str
+                        self.ptml_string += '}\n'
+                    else:
+                        self.ptml_string += "cond "
+                        c_set_str = '\n cond '.join(map(str, child.content)) + "\n"
+                        self.ptml_string += c_set_str
+
                 elif child.type == 'act':
                     if '(' not in child.content.name:
                         self.ptml_string += 'act ' + child.content.name + "()\n"
@@ -212,7 +222,7 @@ class OptBTExpAlgorithm:
 
     def get_ptml(self):
         self.ptml_string = "selector{\n"
-        self.dfs_ptml(self.bt.children[0])
+        self.dfs_ptml(self.bt.children[0],is_root=True)
         self.ptml_string += '}\n'
         return self.ptml_string
 
diff --git a/robowaiter/behavior_tree/obtea/opt_bt_exp_main.py b/robowaiter/behavior_tree/obtea/opt_bt_exp_main.py
index aa07b5d..9a7829f 100644
--- a/robowaiter/behavior_tree/obtea/opt_bt_exp_main.py
+++ b/robowaiter/behavior_tree/obtea/opt_bt_exp_main.py
@@ -31,7 +31,7 @@ class BTOptExpInterface:
         :return: A PTML string representing the outcome of the behavior tree.
         """
         self.goal = goal
-        self.algo = OptBTExpAlgorithm(verbose=True)
+        self.algo = OptBTExpAlgorithm(verbose=False)
         self.algo.clear()
         self.algo.run_algorithm(self.goal, self.actions,self.scene) # 调用算法得到行为树保存至 algo.bt
         self.ptml_string = self.algo.get_ptml()
diff --git a/robowaiter/llm_client/data/test_questions.txt b/robowaiter/llm_client/data/test_questions.txt
index e0d8ea9..fe0c3bd 100644
--- a/robowaiter/llm_client/data/test_questions.txt
+++ b/robowaiter/llm_client/data/test_questions.txt
@@ -1 +1 @@
-{"æµ‹è¯•VLMï¼šåšä¸€æ¯å’–å•¡": {"Answer": "æµ‹è¯•VLMï¼šåšä¸€æ¯å’–å•¡", "Goal": "{\"On(Coffee,CoffeeTable)\"}"}, "æµ‹è¯•VLMï¼šåšä¸€æ¯å’–å•¡æ”¾åˆ°å§å°ä¸Š": {"Answer": "æµ‹è¯•VLMï¼šåšä¸€æ¯å’–å•¡æ”¾åˆ°å§å°ä¸Š", "Goal": "{\"On(Coffee,Bar)\"}"}, "æµ‹è¯•VLMï¼šåšä¸€æ¯å’–å•¡æ”¾åˆ°æ°´æ¯æ¡Œä¸Šå¹¶å€’æ°´": {"Answer": "æµ‹è¯•VLMï¼šåšä¸€æ¯å’–å•¡æ”¾åˆ°æ°´æ¯æ¡Œä¸Šå¹¶å€’æ°´", "Goal": "{\"On(Coffee,WaterTable)\"}"}, "æµ‹è¯•VLNï¼šå‰å¾€2å·æ¡Œ": {"Answer": "æµ‹è¯•VLNï¼šå‰å¾€2å·æ¡Œ", "Goal": "{\"At(Robot,Table2)\"}"}, "æµ‹è¯•AEM": {"Answer": "æµ‹è¯•AEM", "Goal": "{\"EnvExplored()\"}"}, "æµ‹è¯•VLMï¼šå€’ä¸€æ¯æ°´": {"Answer": "æµ‹è¯•VLMï¼šå€’ä¸€æ¯æ°´", "Goal": "{\"On(Water,WaterTable)\"}"}, "æµ‹è¯•VLMï¼šå¼€ç©ºè°ƒ": {"Answer": "æµ‹è¯•VLMï¼šå¼€ç©ºè°ƒ", "Goal": "{\"Is(AC,On)\"}"}, "æµ‹è¯•VLMï¼šå…³ç©ºè°ƒ": {"Answer": "æµ‹è¯•VLMï¼šå…³ç©ºè°ƒ", "Goal": "{\"Is(AC,Off)\"}"}, "æµ‹è¯•VLMï¼šå…³å¤§åŽ…ç¯": {"Answer": "æµ‹è¯•VLMï¼šå…³å¤§åŽ…ç¯", "Goal": "{\"Is(HallLight,Off)\"}"}, "æµ‹è¯•VLMï¼šå¼€å¤§åŽ…ç¯": {"Answer": "æµ‹è¯•VLMï¼šå¼€å¤§åŽ…ç¯", "Goal": "{\"Is(HallLight,On)\"}"}, "æµ‹è¯•VLMï¼šå…³ç­’ç¯": {"Answer": "æµ‹è¯•VLMï¼šå…³ç­’ç¯", "Goal": "{\"Is(TubeLight,Off)\"}"}, "æµ‹è¯•VLMï¼šå¼€ç­’ç¯": {"Answer": "æµ‹è¯•VLMï¼šå¼€ç­’ç¯", "Goal": "{\"Is(TubeLight,On)\"}"}, "æµ‹è¯•VLMï¼šå…³çª—å¸˜": {"Answer": "æµ‹è¯•VLMï¼šå…³çª—å¸˜", "Goal": "{\"Is(Curtain,Off)\"}"}, "æµ‹è¯•VLMï¼šå¼€çª—å¸˜": {"Answer": "æµ‹è¯•VLMï¼šå¼€çª—å¸˜", "Goal": "{\"Is(Curtain,On)\"}"}, "æµ‹è¯•VLMï¼šæ‹–åœ°": {"Answer": "æµ‹è¯•VLMï¼šæ‹–åœ°", "Goal": "{\"Is(Floor,Clean)\"}"}, "æµ‹è¯•VLMï¼šæ“¦æ¡Œå­": {"Answer": "æµ‹è¯•VLMï¼šæ“¦æ¡Œå­", "Goal": "{\"Is(Table1,Clean)\"}"}, "æµ‹è¯•VLMï¼šæ•´ç†æ¤…å­": {"Answer": "æµ‹è¯•VLMï¼šæ•´ç†æ¤…å­", "Goal": "{\"Is(Chairs,Clean)\"}"}, "æµ‹è¯•VLMï¼šæŠŠå†°çº¢èŒ¶æ”¾åˆ°Table2": {"Answer": "æµ‹è¯•VLMï¼šæŠŠå†°çº¢èŒ¶æ”¾åˆ°Table2", "Goal": "{\"On(BottledDrink,Table2)\"}"}, "æˆ‘æœ‰ç‚¹çƒ­ï¼Œèƒ½å¼€ä¸ªç©ºè°ƒå—ï¼Ÿ": {"Answer": "å½“ç„¶å¯ä»¥ï¼Œæˆ‘çŽ°åœ¨å°±å¼€ï¼", "Goal": "{\"Is(AC,On)\"}"}, 
"å¯ä»¥å¸¦æˆ‘åŽ»å—": {"Answer": "å½“ç„¶å¯ä»¥ï¼Œå‰å¾€ä¸€å·æ¡Œ", "Goal": "{\"At(Robot,Table1)\"}"}}
+{"æµ‹è¯•VLMï¼šåšä¸€æ¯å’–å•¡": {"Answer": "æµ‹è¯•VLMï¼šåšä¸€æ¯å’–å•¡", "Goal": "{\"On(Coffee,CoffeeTable)\"}"}, "æµ‹è¯•VLMï¼šåšä¸€æ¯å’–å•¡æ”¾åˆ°å§å°ä¸Š": {"Answer": "æµ‹è¯•VLMï¼šåšä¸€æ¯å’–å•¡æ”¾åˆ°å§å°ä¸Š", "Goal": "{\"On(Coffee,Bar)\"}"}, "æµ‹è¯•VLMï¼šåšä¸€æ¯å’–å•¡æ”¾åˆ°æ°´æ¯æ¡Œä¸Šï¼Œå†å€’ä¸€æ¯æ°´": {"Answer": "æµ‹è¯•VLMï¼šåšä¸€æ¯å’–å•¡æ”¾åˆ°æ°´æ¯æ¡Œä¸Šï¼Œå†å€’ä¸€æ¯æ°´", "Goal": "{\"On(Coffee,WaterTable)\",\"On(Water,WaterTable)\"}"}, "æµ‹è¯•VLNï¼šå‰å¾€2å·æ¡Œ": {"Answer": "æµ‹è¯•VLNï¼šå‰å¾€2å·æ¡Œ", "Goal": "{\"At(Robot,Table2)\"}"}, "æµ‹è¯•AEM": {"Answer": "æµ‹è¯•AEM", "Goal": "{\"EnvExplored()\"}"}, "æµ‹è¯•VLMï¼šå€’ä¸€æ¯æ°´": {"Answer": "æµ‹è¯•VLMï¼šå€’ä¸€æ¯æ°´", "Goal": "{\"On(Water,WaterTable)\"}"}, "æµ‹è¯•VLMï¼šå¼€ç©ºè°ƒ": {"Answer": "æµ‹è¯•VLMï¼šå¼€ç©ºè°ƒ", "Goal": "{\"Is(AC,On)\"}"}, "æµ‹è¯•VLMï¼šå…³ç©ºè°ƒ": {"Answer": "æµ‹è¯•VLMï¼šå…³ç©ºè°ƒ", "Goal": "{\"Is(AC,Off)\"}"}, "æµ‹è¯•VLMï¼šå…³å¤§åŽ…ç¯": {"Answer": "æµ‹è¯•VLMï¼šå…³å¤§åŽ…ç¯", "Goal": "{\"Is(HallLight,Off)\"}"}, "æµ‹è¯•VLMï¼šå¼€å¤§åŽ…ç¯": {"Answer": "æµ‹è¯•VLMï¼šå¼€å¤§åŽ…ç¯", "Goal": "{\"Is(HallLight,On)\"}"}, "æµ‹è¯•VLMï¼šå…³ç­’ç¯": {"Answer": "æµ‹è¯•VLMï¼šå…³ç­’ç¯", "Goal": "{\"Is(TubeLight,Off)\"}"}, "æµ‹è¯•VLMï¼šå¼€ç­’ç¯": {"Answer": "æµ‹è¯•VLMï¼šå¼€ç­’ç¯", "Goal": "{\"Is(TubeLight,On)\"}"}, "æµ‹è¯•VLMï¼šå…³çª—å¸˜": {"Answer": "æµ‹è¯•VLMï¼šå…³çª—å¸˜", "Goal": "{\"Is(Curtain,Off)\"}"}, "æµ‹è¯•VLMï¼šå¼€çª—å¸˜": {"Answer": "æµ‹è¯•VLMï¼šå¼€çª—å¸˜", "Goal": "{\"Is(Curtain,On)\"}"}, "æµ‹è¯•VLMï¼šæ‹–åœ°": {"Answer": "æµ‹è¯•VLMï¼šæ‹–åœ°", "Goal": "{\"Is(Floor,Clean)\"}"}, "æµ‹è¯•VLMï¼šæ“¦æ¡Œå­": {"Answer": "æµ‹è¯•VLMï¼šæ“¦æ¡Œå­", "Goal": "{\"Is(Table1,Clean)\"}"}, "æµ‹è¯•VLMï¼šæ•´ç†æ¤…å­": {"Answer": "æµ‹è¯•VLMï¼šæ•´ç†æ¤…å­", "Goal": "{\"Is(Chairs,Clean)\"}"}, "æµ‹è¯•VLMï¼šæŠŠå†°çº¢èŒ¶æ”¾åˆ°Table2": {"Answer": "æµ‹è¯•VLMï¼šæŠŠå†°çº¢èŒ¶æ”¾åˆ°Table2", "Goal": "{\"On(BottledDrink,Table2)\"}"}, "æˆ‘æœ‰ç‚¹çƒ­ï¼Œèƒ½å¼€ä¸ªç©ºè°ƒå—ï¼Ÿ": {"Answer": 
"å½“ç„¶å¯ä»¥ï¼Œæˆ‘çŽ°åœ¨å°±å¼€ï¼", "Goal": "{\"Is(AC,On)\"}"}, "å¯ä»¥å¸¦æˆ‘åŽ»å—": {"Answer": "å½“ç„¶å¯ä»¥ï¼Œå‰å¾€ä¸€å·æ¡Œ", "Goal": "{\"At(Robot,Table1)\"}"}}
diff --git a/robowaiter/llm_client/data_raw/test_questions.csv b/robowaiter/llm_client/data_raw/test_questions.csv
index 3bb7a86..19b8af4 100644
--- a/robowaiter/llm_client/data_raw/test_questions.csv
+++ b/robowaiter/llm_client/data_raw/test_questions.csv
@@ -1,7 +1,7 @@
 Question,Answer,Goal
 ²âÊÔVLM£º×öÒ»±­¿§·È,²âÊÔVLM£º×öÒ»±­¿§·È,"{""On(Coffee,CoffeeTable)""}"
 ²âÊÔVLM£º×öÒ»±­¿§·È·Åµ½°ÉÌ¨ÉÏ,²âÊÔVLM£º×öÒ»±­¿§·È·Åµ½°ÉÌ¨ÉÏ,"{""On(Coffee,Bar)""}"
-²âÊÔVLM£º×öÒ»±­¿§·È·Åµ½Ë®±­×ÀÉÏ²¢µ¹Ë®,²âÊÔVLM£º×öÒ»±­¿§·È·Åµ½Ë®±­×ÀÉÏ²¢µ¹Ë®,"{""On(Coffee,WaterTable)""}"
+²âÊÔVLM£º×öÒ»±­¿§·È·Åµ½Ë®±­×ÀÉÏ£¬ÔÙµ¹Ò»±­Ë®,²âÊÔVLM£º×öÒ»±­¿§·È·Åµ½Ë®±­×ÀÉÏ£¬ÔÙµ¹Ò»±­Ë®,"{""On(Coffee,WaterTable)"",""On(Water,WaterTable)""}"
 ²âÊÔVLN£ºÇ°Íù2ºÅ×À,²âÊÔVLN£ºÇ°Íù2ºÅ×À,"{""At(Robot,Table2)""}"
 ²âÊÔAEM,²âÊÔAEM,"{""EnvExplored()""}"
 ²âÊÔVLM£ºµ¹Ò»±­Ë®,²âÊÔVLM£ºµ¹Ò»±­Ë®,"{""On(Water,WaterTable)""}"
diff --git a/robowaiter/llm_client/data_tools/csv2dict.py b/robowaiter/llm_client/data_tools/csv2dict.py
index 31feb97..6660c79 100644
--- a/robowaiter/llm_client/data_tools/csv2dict.py
+++ b/robowaiter/llm_client/data_tools/csv2dict.py
@@ -24,4 +24,3 @@ with open(csv_file_path, mode='r', encoding='gbk') as csv_file, \
     json_str = json.dumps(output_dict, ensure_ascii=False)
     # å°†JSONå­—ç¬¦ä¸²å†™å…¥JSONLæ–‡ä»¶ï¼Œå¹¶æ·»åŠ æ¢è¡Œç¬¦
     jsonl_file.write(json_str + '\n')
-s
\ No newline at end of file
diff --git a/robowaiter/scene/tasks/VLM.py b/robowaiter/scene/tasks/VLM/VLM.py
similarity index 95%
rename from robowaiter/scene/tasks/VLM.py
rename to robowaiter/scene/tasks/VLM/VLM.py
index 23cd3af..04e2caf 100644
--- a/robowaiter/scene/tasks/VLM.py
+++ b/robowaiter/scene/tasks/VLM/VLM.py
@@ -22,7 +22,10 @@ class SceneVLM(Scene):
             # (5, self.create_chat_event("æµ‹è¯•VLMï¼šæŠŠå†°çº¢èŒ¶æ”¾åˆ°Table2")),
             # (5, self.create_chat_event("æµ‹è¯•VLMï¼šå…³å¤§åŽ…ç¯"))
             # (5, self.create_chat_event("æµ‹è¯•VLMï¼šåšä¸€æ¯å’–å•¡æ”¾åˆ°å§å°ä¸Š")),
-            (5, self.create_chat_event("æµ‹è¯•VLMï¼šåšä¸€æ¯å’–å•¡æ”¾åˆ°æ°´æ¯æ¡Œä¸Šå¹¶å€’æ°´")),
+            (5, self.create_chat_event("æµ‹è¯•VLMï¼šåšä¸€æ¯å’–å•¡æ”¾åˆ°æ°´æ¯æ¡Œä¸Šï¼Œå†å€’ä¸€æ¯æ°´")),
+            (10, self.create_chat_event("æµ‹è¯•VLMï¼šå…³çª—å¸˜")),
+            # (5, self.create_chat_event("æµ‹è¯•VLNï¼šå‰å¾€2å·æ¡Œ")),
+
         ]
 
     def _reset(self):
diff --git a/robowaiter/scene/tasks/VLM/VLM2.py b/robowaiter/scene/tasks/VLM/VLM2.py
new file mode 100644
index 0000000..6872edd
--- /dev/null
+++ b/robowaiter/scene/tasks/VLM/VLM2.py
@@ -0,0 +1,123 @@
+"""
+视觉语言操作
+机器人根据指令人的指令调节空调，自主探索环境导航到目标点，通过手臂的运动规划能力操作空调，比如开关按钮、调温按钮、显示面板
+"""
+
+import time
+from robowaiter.scene.scene import Scene
+
+class SceneVLM(Scene):
+    def __init__(self, robot):
+        super().__init__(robot)
+        # 在这里加入场景中发生的事件， (事件发生的时间，事件函数)
+        self.event_list = [
+            # (5, self.create_chat_event("æµ‹è¯•VLMï¼šåšä¸€æ¯å’–å•¡")),
+            # (5, self.create_chat_event("æµ‹è¯•VLMï¼šå€’ä¸€æ¯æ°´")),
+            # (5, self.create_chat_event("æµ‹è¯•VLMï¼šå¼€ç©ºè°ƒ")),
+            # (5, self.create_chat_event("æµ‹è¯•VLMï¼šå…³ç©ºè°ƒ")),
+            # (5, self.create_chat_event("æµ‹è¯•VLMï¼šå¼€å¤§åŽ…ç¯")),
+            # (5, self.create_chat_event("æµ‹è¯•VLMï¼šæ‹–åœ°")),
+            # (7, self.create_chat_event("æµ‹è¯•VLMï¼šæ“¦æ¡Œå­")),
+            # (5, self.create_chat_event("æµ‹è¯•VLMï¼šæ•´ç†æ¤…å­")),
+            # (5, self.create_chat_event("æµ‹è¯•VLMï¼šæŠŠå†°çº¢èŒ¶æ”¾åˆ°Table2")),
+            # (5, self.create_chat_event("æµ‹è¯•VLMï¼šå…³å¤§åŽ…ç¯"))
+            # (5, self.create_chat_event("æµ‹è¯•VLMï¼šåšä¸€æ¯å’–å•¡æ”¾åˆ°å§å°ä¸Š")),
+            # (5, self.create_chat_event("æµ‹è¯•VLMï¼šåšä¸€æ¯å’–å•¡æ”¾åˆ°æ°´æ¯æ¡Œä¸Šå¹¶å€’æ°´")),
+            # (8, self.create_chat_event("æµ‹è¯•VLNï¼šå‰å¾€1å·æ¡Œ")),
+
+        ]
+
+    def _reset(self):
+
+        # self.gen_obj(type=5)
+        # self.gen_obj(type=9)
+        # self.op_task_execute(op_type=16, obj_id=0)
+        # self.move_task_area(op_type=4)
+        pass
+
+    def _run(self, op_type=10):
+        # 一个行人从门口走到 吧台
+        # 打招呼需要什么
+        # 行人说 哪里有位置，想晒个太阳
+        # 带领行人去有太阳的地方
+        # 行人说 有点热
+        # 好的，这就去开空调
+
+        scene = self.add_walkers([[0, 0]])
+        self.control_walker(
+            [self.walker_control_generator(walkerID=1, autowalk=False, speed=50, X=100, Y=150, Yaw=0)])
+
+        cont = scene.walkers[0].name+":æˆ‘æœ‰ç‚¹çƒ­ï¼Œèƒ½å¼€ä¸ªç©ºè°ƒå—ï¼Ÿ"
+        self.control_robot_action(0,3,cont)
+
+
+        # 共17个操作
+        # "制作咖啡","倒水","夹点心","拖地","擦桌子","开筒灯","搬椅子",    # 1-7
+        # "关筒灯","开大厅灯","关大厅灯","关闭窗帘","打开窗帘",            # 8-12
+        # "调整空调开关","调高空调温度","调低空调温度",                   # 13-15
+        # "抓握物体","放置物体"                                       # 16-17
+
+        # self.gen_obj()
+        # if op_type <=15:
+        #     self.move_task_area(op_type)
+        #     self.op_task_execute(op_type)
+        # if op_type == 16:   # 16: æŠ“æ“ä½œéœ€è¦ä¼ å…¥ç‰©å“id
+        #     self.move_task_area(op_type, obj_id=0)
+        #     self.op_task_execute(op_type, obj_id=0)
+        # # åŽŸå§‹å§å°å¤„:[247.0, 520.0, 100.0], ç©ºè°ƒå¼€å…³æ—å§å°:[240.0, 40.0, 100.0], æ°´æ¯æ¡Œ:[-70.0, 500.0, 107]
+        # # æ¡Œå­1:[-55.0, 0.0, 107],æŠ¹å¸ƒæ¡Œ:[340.0, 900.0, 99.0]   # æ¡Œå­2:[-55.0, 150.0, 107],
+        # if op_type == 17:   # 17: æ”¾æ“ä½œéœ€è¦ä¼ å…¥æ”¾ç½®ä½ç½®å‘¨å›´çš„å¯è¾¾åŒºåŸŸ
+        #     pos = [240.0, 40.0, 100.0]
+        #     self.move_task_area(op_type, release_pos=pos)
+        #     self.op_task_execute(op_type, release_pos=pos)   # [325.0, 860.0, 100]
+
+        # 流程测试
+        # 抓握放置:抓吧台前生成的酸奶，放到抹布桌上
+        self.gen_obj()
+        # self.move_task_area(16, obj_id=0)
+        # self.op_task_execute(16, obj_id=0)
+        # pos = [340.0, 900.0, 99.0]
+        # self.move_task_area(17, release_pos=pos)
+        # self.op_task_execute(17, release_pos=pos)
+        #
+        # # 做咖啡:做完的咖啡放到水杯桌上
+        # self.move_task_area(1)
+        # self.op_task_execute(1)
+        #
+        # self.find_obj("CoffeeCup")
+        #
+        # self.move_task_area(16, obj_id=275)
+        # self.op_task_execute(16, obj_id=275)
+        # pos = [-70.0, 500.0, 107]
+        # self.move_task_area(17, release_pos=pos)
+        # self.op_task_execute(17, release_pos=pos)
+        #
+        # # 倒水:倒完的水放到旁边桌子上
+        # self.move_task_area(2)
+        # self.op_task_execute(2)
+
+        #
+        # self.move_task_area(16, obj_id=190)
+        # self.op_task_execute(16, obj_id=190)
+        # pos = [-55.0, 0.0, 107]
+        # self.move_task_area(17, release_pos=pos)
+        # self.op_task_execute(17, release_pos=pos)
+
+        # self.test_yaw()
+
+        pass
+    
+    def _step(self):
+        pass
+
+
+if __name__ == '__main__':
+    import os
+    from robowaiter.robot.robot import Robot
+
+    robot = Robot()
+
+    # create task
+    task = SceneVLM(robot)
+    task.reset()
+    task.run()
diff --git a/robowaiter/scene/tasks/VLM/__init__.py b/robowaiter/scene/tasks/VLM/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/sub_task.ptml b/sub_task.ptml
index bc19507..33895cd 100644
--- a/sub_task.ptml
+++ b/sub_task.ptml
@@ -1,5 +1,10 @@
 selector{
-cond On(Coffee,CoffeeTable)
+
+sequence{
+    cond On(Coffee,CoffeeTable)
+    cond On(Coffee,CoffeeTable)
+    }
+
 sequence{
 cond Holding(Nothing)
 act Make(Coffee)