from RoboMemory.Agents.ACAgent import ActorCritic
from RoboMemory.Agents.MemoryAgent import Memory
from RoboMemory.Agents.InformationProcess import InfoProcessor
from RoboMemory.BaseModules.BaseMemory import BaseMemory
from RoboMemory.Envs.ALFREDEnv import ALFREDEnv
from RoboMemory.Modules.Memories.ShortTermMemory import TemporalShortTermMemory, BufferSummarizer, TemporalShortTermMemoryAggregator
from RoboMemory.VariableManager.EBVariableManagers import ALFERDVariableManager
from RoboMemory.agent_utils import ModelConfig, VectorDBConfig
from RoboMemory.Evaluator.EbEvaluator import EmbodiedBenchEvaluator
from RoboMemory.SpatialMemory.spatial_memory import SpatialMemory, SpatialAnalyzer, SpatialMemoryAggregator
import asyncio
from BaseMain import BaseMain
from RoboMemory.Datas.DataCollectLogger import DataLogger
from datetime import datetime
import yaml
import os
import time
import logging
from RoboMemory.Modules.Memories.LTM.EpsodicMem import EpisodicMemory, EpisodicMemoryAggregator, AutobioGenerator
from RoboMemory.Modules.Memories.LTM.SemanticMem import SemanticMemory, SemanticMemAggregator, SemanticMemUpdater, SemExtractor, SemanticMemGenerator

# DIRs
MEMORY_DIR = f"./ckpt/MemoryBuffer" #   


#    vlm

API_KEY = "<|your api key|>"
BASE_URL = "https://dashscope.aliyuncs.com/compatible-mode/v1"


class ALFREDRoboMemoryAgent(BaseMain):
    def __init__(
            self,
            
            # Actor Critic config
            actor_config: ModelConfig,
            critic_config: ModelConfig,
            actor_prompt_path: str,
            critic_prompt_path: str,
            
            # Info preprocessor
            step_summarizer_config: ModelConfig,
            spatial_query_generator_config: ModelConfig,
            semantic_query_generator_config: ModelConfig,
            episodic_query_generator_config: ModelConfig,
            step_summarizer_prompt: str,
            spatial_query_generator_prompt: str,
            semantic_query_generator_prompt: str,
            episodic_query_generator_prompt: str,
            
            # Memory Config
            temporal_short_term_memory_config : ModelConfig,
            spatial_short_term_memory_config : ModelConfig,
            embedding_config : ModelConfig,
            
            # Long Term Memory Config
            episodic_memory_generator_config : ModelConfig,
            semantic_memory_upater_config : ModelConfig,
            semantic_memory_generator_config : ModelConfig,
            semantic_memory_extractor_config : ModelConfig,
            
            # function   
            function_filter_list = ['drop'],
            selected_indexes = 0,
            eval_set_index = 0,
            
            # example
            example_path = "./RoboMemory/templates/Knowledge/sample.txt",
            knowledge_path = "./RoboMemory/templates/Knowledge/knowledge.txt",
            
            # ckpt
            ckpt_path: str = "./ckpt", 
            record_name: str = "TASK", 
            image_dir_name: str = "img", 
            image_type: str = "jpeg",
            
            # result record path
            result_record_dir : str = "./evaluation",
            
            # optional setings:
            max_step: int =  40,
            
            # Ablation
            planner_obs : bool = True,
            critic_obs : bool = True,
            use_critic : bool = True,
        ):
        super().__init__()
        
        self.ACagent = ActorCritic(
            actor_config = actor_config,
            critic_config = critic_config,
            actor_prompt_path = actor_prompt_path,
            critic_prompt_path = critic_prompt_path
        )
        
        self.info_preprocessor = InfoProcessor(
            step_summarizer_config=step_summarizer_config,
            spatial_query_generator_config = spatial_query_generator_config,
            semantic_query_generator_config = semantic_query_generator_config,
            episodic_query_generator_config = episodic_query_generator_config,
            step_summarizer_prompt = step_summarizer_prompt,
            spatial_query_generator_prompt = spatial_query_generator_prompt ,
            semantic_query_generator_prompt = semantic_query_generator_prompt,  
            episodic_query_generator_prompt = episodic_query_generator_prompt
        )
        
        self.env = ALFREDEnv(selected_indexes, eval_set_index, function_filter_list = function_filter_list)
        self.selected_indexes = selected_indexes
        self.eval_set_index = eval_set_index
        
        # logger        
        self.ckpt_path = ckpt_path
        self.record_name = record_name
        self.image_dir_name = image_dir_name
        
        
        self.task_start_time = time.time() #    bug
        
        
        self.init_time = datetime.now().strftime("%m%d_%H%M")
        
        self.api_descriptions = self.env.api_processor.get_api_description()
        
        self.ckpt_path = f"{self.ckpt_path}/{self.init_time}-[{self.eval_set_index}-{self.selected_indexes}]-{self.env.task}"
        
        self.image_type = image_type
        
        self.step = 0
        
        self.max_step = max_step
        
        
        with open(example_path, 'r', encoding='utf-8') as f:   
            self.examples = f.read()
        
        with open(knowledge_path, 'r', encoding='utf-8') as f:   
            self.knowledges = f.read()
        
        self.global_var = ALFERDVariableManager()
        
        self.evaluator = EmbodiedBenchEvaluator(eval_csv_dir = result_record_dir)
        
        #     Memory
        
        self.memories = []
        
        self.short_term_memory_list = []
        
        self.long_term_memory_list = []
        
        self.init_short_term_memory(
            temporal_short_term_memory_config = temporal_short_term_memory_config,
            spatial_short_term_memory_config = spatial_short_term_memory_config,
            embedding_config = embedding_config,
        )
        
        self.init_long_term_memory(
            episodic_memory_generator_config = episodic_memory_generator_config,
            semantic_memory_generator_config = semantic_memory_generator_config,
            semantic_memory_upater_config = semantic_memory_upater_config,
            semantic_memory_extractor_config = semantic_memory_extractor_config,
            embedding_config = embedding_config,
        )
        
        self.memory = Memory(
            memory_list = self.memories
        )
        
        
        #    memory
        self.short_term_memory = Memory(
            memory_list= self.short_term_memory_list
        )
        
        self.long_term_memory = Memory(
            memory_list= self.long_term_memory_list
        )
        
        
        # ablation
        
        self.planner_obs = planner_obs
        self.critic_obs = critic_obs
        self.use_critic = use_critic
        
    def init_short_term_memory(
            self,
            temporal_short_term_memory_config : ModelConfig,
            spatial_short_term_memory_config : ModelConfig,
            embedding_config : ModelConfig,
        ):
       
        # Short Term Memory
        self.temporal_summarizer = BufferSummarizer(
            model_config=temporal_short_term_memory_config, 
            template_path="./RoboMemory/templates/prompts/ShortTermMemory.prompt"
        )

        self.temporal_aggregator = TemporalShortTermMemoryAggregator()
        
        self.temporal_short_term_memory = TemporalShortTermMemory(
            updater = self.temporal_summarizer, 
            aggregator = self.temporal_aggregator,
            memory_path = MEMORY_DIR,
            restore = False,
            max_capacity = 3
        )
        
        # Spatial Memory
        
        self.spatial_analyzer = SpatialAnalyzer(
            model_config = spatial_short_term_memory_config,
            template_path="./RoboMemory/templates/prompts/TripletExtraction.prompt",
            integration_template_path="./RoboMemory/templates/prompts/InformationIntegration.prompt"
        )
        
        
        self.spatial_aggregator = SpatialMemoryAggregator()
        
        #        
        vectordb_config = VectorDBConfig(
            collection_name="spatial_vector_db",
            persist_directory=f"{self.ckpt_path}/Spatial_vectorDB"
        )
        
        self.spatial_memory = SpatialMemory(
            updater=self.spatial_analyzer,
            aggregator=self.spatial_aggregator,
            embedding_config=embedding_config,
            vectordb_config=vectordb_config,
            graph_db_path=f"{self.ckpt_path}",
            graph_db_name="semantic_graph.pkl",
            enable_forgetting = False,
            memory_path = f"{self.ckpt_path}/MemoryBuffer", #       
            logging_path = f"{self.ckpt_path}",
            enable_visualization=True,
            visualization_config = {
                'output_dir': f"{self.ckpt_path}/Spatial_Graph",
                'enable_chinese_font': True
            },
            graph_search_top_k = 3,
            graph_search_adj_degree = 2
        )

        short_term_memory = [self.temporal_short_term_memory, self.spatial_memory]
        
        self.memories.extend(short_term_memory)
        self.short_term_memory_list.extend(short_term_memory)
        
        
    def init_long_term_memory(
            self,
            episodic_memory_generator_config : ModelConfig,
            semantic_memory_generator_config : ModelConfig,
            semantic_memory_upater_config : ModelConfig,
            semantic_memory_extractor_config : ModelConfig,
            embedding_config : ModelConfig 
        ):
       
        
        # episodic memory
        

        self.episodic_aggregator = EpisodicMemoryAggregator()
        
        self.autobio_generator = AutobioGenerator(episodic_memory_generator_config)
        
        self.episodic_memory = EpisodicMemory(
            aggregator=self.episodic_aggregator,
            autobio_generator=self.autobio_generator,
            embedding_config=embedding_config,
            vectordb_config=VectorDBConfig(
                collection_name="episodic_vector_db",
                persist_directory=f"{self.ckpt_path}/Episodic_vectorDB"
            ),
            retrieve_k_task=5,
            log_path = self.ckpt_path
        )

        # semantic memory
        self.semantic_updater = SemanticMemUpdater(semantic_memory_upater_config)
        
        self.semantic_aggregator = SemanticMemAggregator()
        
        self.semantic_generator = SemanticMemGenerator(semantic_memory_generator_config)
        
        self.semantic_extractor = SemExtractor(semantic_memory_extractor_config)
        
         
        
        self.semantic_memory = SemanticMemory(
            updater=self.semantic_updater,
            aggregator=self.semantic_aggregator,
            extractor=self.semantic_extractor,
            memory_generator=self.semantic_generator,  
            embedding_config=embedding_config,
            vectordb_config=VectorDBConfig(
                collection_name="semantic_vector_db",
                persist_directory=f"{MEMORY_DIR}/Semantic_vectorDB"
            ),
            retrieve_k_task=2, #    top-k
            retrieve_k_action=2,
            top_k=10, #    top-k
            log_path = self.ckpt_path
        )
        
        long_term_memory_list = [
            #self.episodic_memory, 
            self.semantic_memory
        ]
        
        self.memories.extend(long_term_memory_list)
        self.long_term_memory_list.extend(long_term_memory_list)
        
    
    async def task_level_memory_update(self):
     
        
        memory_infos = {
            "step_summary": self.global_var.current_step_summary,
            "possible_objects": self.env.objects,
        }
        
        if self.global_var.global_step > 1:
            memory_infos["SemanticMemory"] = {
                "iterations": self.global_var.current_belief.get("TemporalShortTermMemory", 'No belief available now'),
                "action": self.global_var.current_action
            }
            
            memory_update_successes = await self.memory.update(memory_infos)
        
        else:
            #                
            memory_update_successes = await self.short_term_memory.update(memory_infos)
        
        #           temporal belief 
        infos = {
            "SemanticMemory": {
                "task": self.env.task,
                "iterations": self.global_var.current_belief.get("TemporalShortTermMemory", 'No belief available now'), #          spatial memory              spatial memory                      
                "api_descriptions": self.api_descriptions 
            },
            "EpisodicMemory": {
                "task": self.env.task,
                "iterations": self.global_var.current_belief.get("TemporalShortTermMemory", 'No belief available now'), #          spatial memory              spatial memory                      
                "api_descriptions": self.api_descriptions 
            },
        }
        
        # 3. Update
        await self.long_term_memory.update(
            infos = infos
        )
        
        del infos
        
        
        
        
    async def run(self) -> bool:
        
        error = False
        
      
        
        
        
        try:
            await self.inner_run()
            error_message = "correct"
            error = False
        except Exception as e:
            error_message = str(e)
            logging.error(error_message) 
            error = True
            # raise e
        
        task_end_time = time.time()
        #         
        await self.task_level_memory_update()
        
        total_time = task_end_time - self.task_start_time
        self.global_var.update_variables(run_time = total_time)
        
        self.evaluator.record_data(
            env_type = "alfred", # alfred    habitat
            task_type = self.eval_set_index, # 0-5  5 
            task_name = self.env.task, # task   
            task_id = self.selected_indexes, #  task    id
            
            #     
            total_iteration = self.global_var.global_step,
            total_time = self.global_var.run_time,
            
            #     
            success = self.global_var.task_success,
            max_progress = self.global_var.max_progress,
            
            # Error   
            error_message = error_message
        )
        
        if hasattr(self, "logger"):
            self.logger.console_log(global_step = -1, returns = yaml.dump(self.global_var.action_list))
        
        self.evaluator.save()
        self.env.close()
        
        return error
            
            
        
    async def inner_run(self):
 
          
        
        img, score, done, info = self.env.reset()
        
        #      variable
        self.global_var.update_variables(
            global_step = self.step,
            current_img = img,
            score = score,
            done = done,
            current_info = info,
            env_feedback_info = f"Task initialized." #    
        )
        
        #    logger   task
        self.logger = DataLogger(
            ckpt_path = self.ckpt_path, 
            record_name = self.record_name, 
            image_dir_name = self.image_dir_name, 
            image_type = self.image_type
        )
        
        del img, score, done, info
        
        self.task_start_time = time.time()
        
        while not (self.global_var.done or self.global_var.truncated):
                
            query_params = {
                "memory": self.global_var.current_belief,
                "task": self.env.task
            }
            
            step_sum_params = {
                "current_action": self.global_var.current_action,
                "feedback": self.global_var.env_feedback_info,
                "current_belief": {
                    "Temporal Memory": self.global_var.current_belief.get("TemporalShortTermMemory", 'No belief available now'),
                    "Spatial Memory": self.global_var.current_belief.get("SpatialMemory", '')
                },
                "working_memory": self.global_var.current_step_summary, #           
                "functions": self.api_descriptions,
                "examples": self.examples
            }
            
            step_summary, spatial_queries, semantic_queries, episodic_queries = await self.info_preprocessor.generate_infos(
                query_params = query_params,
                step_sum_params = step_sum_params,
                image_paths = self.global_var.current_img,
                image_type = self.image_type
            )
            
            self.global_var.update_variables(
                current_step_summary = step_summary,
                current_spatial_queries = spatial_queries,
                current_semantic_queries = semantic_queries,
                current_episodic_queries = episodic_queries
            )
            
            
            del step_summary, spatial_queries, semantic_queries, episodic_queries, query_params, step_sum_params
            
            image_paths = self.global_var.current_img if self.planner_obs else None
            
            actor_params = {
                "task": self.env.task,
                "functions": self.api_descriptions,
                "objects": self.env.objects,
                "examples": self.examples,
                "last_action": self.global_var.last_action
            }
            
            # plan
            if self.global_var.action_suitability: #           memory
                
                #       
                # Memory update (Plan)
                # Memory               warning  return           memory      memory_infos
                
                    
                # non-parallel  update -> retrieve -> plan
                
                #     memory      
                
                # step > 1                            0        1   feedback        
                memory_infos = {
                    "step_summary": self.global_var.current_step_summary,
                    "possible_objects": self.env.objects,
                }
                
                if self.global_var.global_step > 1:
                    memory_infos["SemanticMemory"] = {
                        "iterations": self.global_var.current_belief.get("TemporalShortTermMemory", 'No belief available now'),
                        "action": self.global_var.current_action,
                        "api_descriptions": self.api_descriptions 
                    }
                    
                    memory_update_successes = await self.memory.update(memory_infos)
                
                else:
                    #                
                    memory_update_successes = await self.short_term_memory.update(memory_infos)
                
                
                
                # step > 0           
                if self.global_var.global_step > 0:
                    
                    queries = {
                        "SpatialMemory": self.global_var.current_spatial_queries,
                        "SemanticMemory": self.global_var.current_semantic_queries, 
                        "EpisodicMemory": self.global_var.current_episodic_queries 
                    } #      queries_list        Query  memory     
                    
                    
                    self.logger.console_log(global_step = self.step, returns = queries, agent_name = "Queries for spatial memory") #    belief
                
                    belief = self.memory.retrieve(queries)
                    
                    self.global_var.update_variables(current_belief = belief)
                    
                    del belief, queries
                    
                    
                #   belief      belief     
                actor_params["history"] =  self.global_var.current_belief
                
                
                
                ac_result = await self.ACagent.execute('actor', params = actor_params, image_paths = image_paths, image_type=self.image_type)
                
                results = [ac_result, memory_update_successes] #       return  
                    
                del memory_infos, actor_params, image_paths
            
            else: #     
                
                #           current belief   
                actor_params["history"] =  self.global_var.current_belief
                
                # Memory      
                
                #      ,     reflectionapt
                actor_params["reflection"] = self.global_var.critic_reflection
                
                    
                task_list = [
                    self.ACagent.execute('actor', params = actor_params, image_paths = image_paths, image_type=self.image_type)
                ]
                
                
                results = await asyncio.gather(*task_list)
                
                # **            critic             True            critic 
                
                self.global_var.update_variables(
                    action_suitability = True, #        True
                    critic_reflection = None
                )
                
                del actor_params, image_paths
            
            #          result
            subgoal, action_plan, params, CoT, return_str = results[0]
            
            self.global_var.update_variables(
                subgoal = subgoal,
                action_plan = action_plan,
                actor_CoT = CoT,
                actor_params = params,
                actor_return = return_str
            )
            
            
            del subgoal, action_plan, CoT, results, return_str, params
                
            ##### Log    #####
            
            actor_params = self.global_var.actor_params.copy()
            
            actor_params.pop('objects')
            actor_params.pop('examples')
            actor_params.pop('functions')
            
            actor_params = yaml.dump( 
                actor_params,# objects   
                indent=2,
                allow_unicode=True,  #     
                default_flow_style=False,  #         
                sort_keys=False       #         
            )
                
            self.logger.console_log(global_step = self.step, returns = actor_params, agent_name = "Input Info") #    belief
            
            self.logger.console_log(global_step = self.step, returns = self.global_var.current_step_summary, agent_name = "Observation") # log    observation
        
            self.logger.console_log(global_step = self.step, returns = self.global_var.actor_return, agent_name = "Actor") # log     
            
            self.logger.log(
                global_step = self.step,
                memory = self.global_var.current_belief,
                obs_image = self.global_var.current_img, #              image    
                obs_text = self.global_var.current_step_summary,
                CoT = self.global_var.actor_CoT,
                AC = "Actor",
                save_inputs = actor_params,
                save_outputs = {
                    "subgoal": self.global_var.subgoal,
                    "action_plan": self.global_var.action_plan
                }
            ) # log   
            
            del actor_params
            
            ####################
            
            #     action
            
            img, score, done, truncated, info = self.env.step(self.global_var.action_plan[0]) # first action
            
            current_action = self.global_var.action_plan[0]
            
            self.step += 1
            
            self.global_var.update_variables(
                global_step = self.step,
                current_img = img,
                score = score,
                done = done,
                truncated = truncated,
                current_info = info,
                current_action = current_action,
            )
            
            #              
            self.memory.save()
            
            # log        
            
            action_str = action_str = (
                f"Task success: {self.global_var.task_success}\n"
                f"Task prograss: {self.global_var.task_progress}\n"
                f"Task done: {self.global_var.done}\n"
                f"Execute Action: {self.global_var.current_action}\n"
                f"Env Feedback:\n{self.global_var.env_feedback_info}" # log      
            )
            
            self.logger.console_log(global_step = self.step, returns = action_str)
            
            del img, score, done, truncated, info, current_action, action_str
            
            if self.use_critic:
                for action in self.global_var.action_plan[1:]: # the rest of actions
                    
                    # preprocess info
                    
                    # **       short-term memory    step summary     
                    
                
                    query_params = {
                        "memory": self.global_var.current_belief,
                        "task": self.env.task
                    }
                    
                    step_sum_params = {
                        "current_action": self.global_var.current_action,
                        "feedback": self.global_var.env_feedback_info,
                        "working_memory": self.global_var.current_step_summary,
                        "current_belief": {
                            "Temporal Memory": self.global_var.current_belief.get("TemporalShortTermMemory", 'No belief available now'),
                            "Spatial Memory": self.global_var.current_belief.get("SpatialMemory", '')
                        },
                        "functions": self.api_descriptions,
                        "examples": self.examples
                    }
                
                    step_summary, spatial_queries, semantic_queries, episodic_queries = await self.info_preprocessor.generate_infos(
                        query_params = query_params,
                        step_sum_params = step_sum_params,
                        image_paths = self.global_var.current_img,
                        image_type = self.image_type
                    )
                    
                    self.global_var.update_variables(
                        current_step_summary = step_summary,
                        current_spatial_queries = spatial_queries,
                        current_semantic_queries = semantic_queries,
                        current_episodic_queries = episodic_queries
                    )

                    
                    
                    del step_summary, spatial_queries, semantic_queries, episodic_queries, query_params, step_sum_params
                    
                    # Memory update (Critic)
                    # infos:    available   information Memory       
                    
                    
                    # Step summary            spatial   temporal memory
                    
                    memory_infos = {
                        "step_summary": self.global_var.current_step_summary,
                        "possible_objects": self.env.objects,
                    }
                    
                    if self.global_var.current_belief != '' and self.global_var.current_belief["TemporalShortTermMemory"] != '':
                        memory_infos['SemanticMemory'] = {
                            "iterations": self.global_var.current_belief.get("TemporalShortTermMemory", 'No belief available now'),
                            "action": self.global_var.current_action,
                            "api_descriptions": self.api_descriptions
                        }
                
                    else:
                        logging.warning(f"No Short term memory for Semantic memory update yet!")
                        
                        
                    
                    
                    image_paths = self.global_var.current_img if self.critic_obs else None
          
                    #     
                    # update -> retrieve -> critic
                    memory_update_successes = await self.memory.update(memory_infos) #            
                    
                    queries = {
                        "SpatialMemory": self.global_var.current_spatial_queries,
                        "SemanticMemory": self.global_var.current_semantic_queries, 
                        "EpisodicMemory": self.global_var.current_episodic_queries 
                    } 
                    
                    self.logger.console_log(global_step = self.step, returns = queries, agent_name = "Queries for spatial memory") 
                
                    
                    belief = self.memory.retrieve(queries)
                
                
                    self.global_var.update_variables(current_belief = belief)
                    
                    del belief, queries
                    
                    # critic
                    #    critic             action            action 
                    critic_params = {
                        "task": self.env.task,
                        "subgoal": self.global_var.subgoal,
                        "functions": self.api_descriptions,
                        "action": action,
                        "objects": self.env.objects,
                        "examples": self.examples,
                        "last_action": self.global_var.last_action
                    }
                    
                    critic_params["history"] = self.global_var.current_belief
                    
                    critic_result = await self.ACagent.execute('critic', params = critic_params, image_paths = image_paths, image_type=self.image_type)

                    results = [memory_update_successes, critic_result]
                        
                    memory_update_successes = results[0] #   memory update      
                    
                    action_suitability, reflection, params, CoT, return_str = results[1]
                    
                    self.global_var.update_variables(
                        action_suitability = action_suitability,
                        critic_reflection = reflection,
                        critic_params = params,
                        critic_CoT = CoT,
                        critic_return = return_str
                    )
                    
                    del action_suitability, reflection, params, CoT, return_str, memory_infos, critic_params, results, image_paths
                
                    ##### Log Critic    #####
                    
                    critic_params = self.global_var.critic_params.copy()
                
                    critic_params.pop('objects')
                    critic_params.pop('examples')
                    critic_params.pop('functions')
                    
                    critic_params = yaml.dump( 
                        critic_params,# objects   
                        indent=2,
                        allow_unicode=True,  #     
                        default_flow_style=False,  #         
                        sort_keys=False       #         
                    )
                    
                    self.logger.console_log(global_step = self.step, returns = critic_params, agent_name = "Input Info") #    belief
                
                    self.logger.console_log(global_step = self.step, returns = self.global_var.current_step_summary, agent_name =  "Observation") # log       observation
                    
                    self.logger.console_log(global_step = self.step, returns = self.global_var.critic_return, agent_name =  "Critic")
                    
                    self.logger.log(
                        global_step = self.global_var.global_step,
                        memory = self.global_var.current_belief,
                        obs_image = self.global_var.current_img, #              image    
                        obs_text = self.global_var.current_step_summary,
                        CoT = self.global_var.critic_CoT,
                        AC = "Critic",
                        save_inputs = critic_params,
                        save_outputs = {
                            "action_suiltability": self.global_var.action_suitability,
                            "reflection": self.global_var.critic_reflection
                        }
                    ) # log   
                    
                    del critic_params
                    
                    ####################
                    
                    if self.global_var.action_suitability:
                        #      
                        img, score, done, truncated, info = self.env.step(action) # first action
                        self.step += 1
                        
                        #     
                        self.global_var.update_variables(
                            current_action = action,
                            global_step = self.step,
                            score = score,
                            current_img = img,
                            done = done,
                            current_info = info,
                            truncated = truncated
                        )
                        
                        #              
                        self.memory.save()
                        
                        # log        
                
                        action_str = (
                            f"Task success: {self.global_var.task_success}\n"
                            f"Task prograss: {self.global_var.task_progress}\n"
                            f"Task done: {self.global_var.done}\n"
                            f"Execute Action: {self.global_var.current_action}\n"
                            f"Env Feedback:\n{self.global_var.env_feedback_info}" # log      
                        )
                        
                        self.logger.console_log(global_step = self.step, returns = action_str)
                        
                        del img, score, done, truncated, info, action_str
                        
                        if self.step > self.max_step: #                 
                            #       
                            truncated = True
                            self.global_var.update_variables(done = True)

                    else:
                        del action
                        break
            
                if self.step > self.max_step:
                    #       
                    truncated = True
                    self.global_var.update_variables(done = True)
            
            if self.step > self.max_step:
                #       
                truncated = True
                self.global_var.update_variables(done = True)
        
        return
        
        
            
def long_term_memory_update(
        memory: BaseMemory, 
        global_var: ALFERDVariableManager, 
        env: ALFREDEnv
    ):
   
    
    #                
    #       belief         
    
    #                  
    pass
        
        
if __name__ == "__main__":
    
    #    log
    logging.basicConfig(
        level=logging.INFO,  #
        format='%(asctime)s - %(name)s - %(levelname)s - %(message)s',
        filemode='a'  #     
    )
    
    config_72_vl_ali = ModelConfig( #     32b   
        model = "qwen2.5-vl-72b-instruct",
        base_url = BASE_URL,
        api_key =  API_KEY,
        temperature = 0
    )
    
    embedding_config = ModelConfig(
        model="text-embedding-v4",
        base_url=BASE_URL,
        api_key=API_KEY
    )
    
    #          for       
    # 15      
    # [0, 2, 4, 5, 7, 10, 15, 20, 26, 31, 48]
    # 0, 4, 5, 7, 10, 15, 20, 26, 
    #      :
    already_list = list(range(44)) + [45, 48]
    type_indexes = [0]
    task_indexes = [2, 7, 10, 15, 20, 26, 31, 48] # 5-3, 7   bug , 0-5  bug
    # 5-3, 7   bug , 0-5  bug
    
    # 44     
    
    total_task = len(task_indexes) * len(type_indexes)
    task_num = 0
    
    tolerance = 3
    
    for type_index in type_indexes:
        for task_index in task_indexes:
            
            logging.info(f"[{task_num + 1}/{total_task}] task {type_index}-{task_index} START")
            
            #    Memory
            
            for t in range(tolerance): #             
                
                logging.info(f"RETRY[{t}/{tolerance}]")
                
                try:
                    
                    
                    agent = ALFREDRoboMemoryAgent(
                        
                        # Actor-Critic
                        actor_config=config_72_vl_ali,
                        critic_config=config_72_vl_ali,
                        actor_prompt_path="./RoboMemory/templates/prompts/Planner.prompt",
                        critic_prompt_path="./RoboMemory/templates/prompts/Critic.prompt",
                        
                        # Infomation Gathering
                        step_summarizer_config=config_72_vl_ali,
                        spatial_query_generator_config=config_72_vl_ali,
                        semantic_query_generator_config=config_72_vl_ali,
                        episodic_query_generator_config=config_72_vl_ali,
                        
                        step_summarizer_prompt="./RoboMemory/templates/prompts/StepSumGenerator.prompt",
                        spatial_query_generator_prompt="./RoboMemory/templates/prompts/Query_Generators/SpatialQueryGenerator.prompt",
                        semantic_query_generator_prompt="./RoboMemory/templates/prompts/Query_Generators/SemanticQueryGenerator.prompt",
                        episodic_query_generator_prompt="./RoboMemory/templates/prompts/Query_Generators/EpisodicQueryGenerator.prompt",
                        
                        # Spatial-Temporal Short-term Memory
                        temporal_short_term_memory_config=config_72_vl_ali,
                        spatial_short_term_memory_config=config_72_vl_ali,
                        embedding_config=embedding_config,
                        
                        # long-term memories
                        semantic_memory_generator_config=config_72_vl_ali,
                        semantic_memory_upater_config=config_72_vl_ali,
                        semantic_memory_extractor_config=config_72_vl_ali,
                        episodic_memory_generator_config=config_72_vl_ali,
                        
                        
                        #    env
                        function_filter_list = [],
                        selected_indexes = task_index,
                        eval_set_index = type_index
                    )
                    
                    error = asyncio.run(agent.run())
                    
                    time.sleep(5)
                        
                    if error:
                        
                        logging.error(f"[{task_num + 1}/{total_task}] task {type_index}-{task_index} INNER LOOP ERROR")
                        
                        continue
                    else:
                        break #         
                
                except Exception as e:
                    
                    logging.error(f"[{task_num + 1}/{total_task}] task {type_index}-{task_index} OUTER LOOP ERROR: {str(e)}")
                    
                    # raise e
                    
                    continue
            
            logging.info(f"[{task_num + 1}/{total_task}] task {type_index}-{task_index} END")
            
            task_num += 1
    
    
        
    
    