diff --git a/.gitattributes b/.gitattributes index 7f14244348..865da2ca2d 100644 --- a/.gitattributes +++ b/.gitattributes @@ -12,6 +12,11 @@ *.jpg binary *.gif binary *.ico binary +*.jpeg binary +*.mp3 binary +*.zip binary +*.bin binary + # Preserve original line endings for specific document files *.doc text eol=crlf diff --git a/.github/ISSUE_TEMPLATE/show_me_the_bug.md b/.github/ISSUE_TEMPLATE/show_me_the_bug.md index 504a2bd124..0c33f0319f 100644 --- a/.github/ISSUE_TEMPLATE/show_me_the_bug.md +++ b/.github/ISSUE_TEMPLATE/show_me_the_bug.md @@ -19,6 +19,7 @@ assignees: '' - LLM type and model name: - System version: - Python version: +- MetaGPT version or branch: diff --git a/.github/workflows/build-package.yaml b/.github/workflows/build-package.yaml index 7f4fee53e3..294a13f71a 100644 --- a/.github/workflows/build-package.yaml +++ b/.github/workflows/build-package.yaml @@ -1,8 +1,9 @@ name: Build and upload python package on: + workflow_dispatch: release: - types: [created] + types: [created, published] jobs: deploy: diff --git a/.gitignore b/.gitignore index 6bc67fa61e..aa5edd74a9 100644 --- a/.gitignore +++ b/.gitignore @@ -1,7 +1,7 @@ ### Python template # Byte-compiled / optimized / DLL files -__pycache__/ +__pycache__ *.py[cod] *$py.class @@ -27,6 +27,8 @@ share/python-wheels/ .installed.cfg *.egg MANIFEST +metagpt/tools/schemas/ +examples/data/search_kb/*.json # PyInstaller # Usually these files are written by a python scripts from a template @@ -151,9 +153,14 @@ allure-results .vscode key.yaml -data +/data/ data.ms examples/nb/ +examples/default__vector_store.json +examples/docstore.json +examples/graph_store.json +examples/image__vector_store.json +examples/index_store.json .chroma *~$* workspace/* @@ -168,6 +175,7 @@ output tmp.png .dependencies.json tests/metagpt/utils/file_repo_git +tests/data/rsp_cache_new.json *.tmp *.png htmlcov @@ -178,4 +186,5 @@ cov.xml *.faiss *-structure.csv *-structure.json -metagpt/tools/schemas \ No newline at end of file +*.dot +.python-version diff --git a/MANIFEST.in b/MANIFEST.in new file mode 100644 index 0000000000..292433f800 --- /dev/null +++ b/MANIFEST.in @@ -0,0 +1,3 @@ +recursive-include metagpt/ext/stanford_town/prompts *.txt +recursive-include metagpt/ext/stanford_town/static_dirs *.csv +recursive-include metagpt/ext/stanford_town/static_dirs *.json \ No newline at end of file diff --git a/README.md b/README.md index 72ce034125..8f5cc53935 100644 --- a/README.md +++ b/README.md @@ -26,7 +26,9 @@

## News

-🚀 March. 01, 2024: Our Data Interpreter paper is on arxiv. Find all design and benchmark details [here](https://arxiv.org/abs/2402.18679)!
+🚀 Mar. 29, 2024: [v0.8.0](https://github.com/geekan/MetaGPT/releases/tag/v0.8.0) released. Now you can import and use Data Interpreter via the PyPI package. Meanwhile, we integrated the RAG module and added support for multiple new LLMs.
+
+🚀 Mar. 14, 2024: Our **Data Interpreter** paper is on [arxiv](https://arxiv.org/abs/2402.18679). Check the [example](https://docs.deepwisdom.ai/main/en/DataInterpreter/) and [code](https://github.com/geekan/MetaGPT/tree/main/examples/di)!

🚀 Feb. 08, 2024: [v0.7.0](https://github.com/geekan/MetaGPT/releases/tag/v0.7.0) released, supporting assigning different LLMs to different Roles. We also introduced [Data Interpreter](https://github.com/geekan/MetaGPT/blob/main/examples/di/README.md), a powerful agent capable of solving a wide range of real-world problems.

@@ -55,40 +57,49 @@

Software Company Multi-Agent Schematic (Gradually Implementing)
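The v0.8.0 news above mentions the newly integrated RAG module; it is exercised later in this diff by `examples/rag_pipeline.py` and `examples/rag_search.py`. A minimal sketch of the module's entry point, assuming the `SimpleEngine` API those examples use and the sample document they add under `examples/data/rag/`:

```python
import asyncio

from metagpt.rag.engines import SimpleEngine


async def main():
    # Build an in-memory index over the sample document added in this diff,
    # then ask one question against it.
    engine = SimpleEngine.from_docs(input_files=["examples/data/rag/travel.txt"])
    answer = await engine.aquery("What does Bob like?")
    print(answer)  # expected: something like "Bob likes traveling."


asyncio.run(main())
```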

-## Install
+## Get Started

-### Pip installation
+### Installation

> Ensure that Python 3.9+ is installed on your system. You can check this by using: `python --version`.
> You can use conda like this: `conda create -n metagpt python=3.9 && conda activate metagpt`

```bash
-pip install metagpt
-# https://docs.deepwisdom.ai/main/en/guide/get_started/configuration.html
-metagpt --init-config # it will create ~/.metagpt/config2.yaml, just modify it to your needs
+pip install --upgrade metagpt
+# or `pip install --upgrade git+https://github.com/geekan/MetaGPT.git`
+# or `git clone https://github.com/geekan/MetaGPT && cd MetaGPT && pip install --upgrade -e .`
```

+For detailed installation guidance, please refer to [cli_install](https://docs.deepwisdom.ai/main/en/guide/get_started/installation.html#install-stable-version)
+ or [docker_install](https://docs.deepwisdom.ai/main/en/guide/get_started/installation.html#install-with-docker)
+
### Configuration

+You can initialize the config of MetaGPT by running the following command, or manually create the `~/.metagpt/config2.yaml` file:
+```bash
+# Check https://docs.deepwisdom.ai/main/en/guide/get_started/configuration.html for more details
+metagpt --init-config # it will create ~/.metagpt/config2.yaml, just modify it to your needs
+```
+
You can configure `~/.metagpt/config2.yaml` according to the [example](https://github.com/geekan/MetaGPT/blob/main/config/config2.example.yaml) and [doc](https://docs.deepwisdom.ai/main/en/guide/get_started/configuration.html):

```yaml
llm:
  api_type: "openai" # or azure / ollama / open_llm etc. Check LLMType for more options
-  model: "gpt-4-turbo-preview" # or gpt-3.5-turbo-1106 / gpt-4-1106-preview
+  model: "gpt-4-turbo" # or gpt-3.5-turbo-1106 / gpt-4-1106-preview
  base_url: "https://api.openai.com/v1" # or forward url / other llm url
  api_key: "YOUR_API_KEY"
```

### Usage

-After installation, you can use it as CLI
+After installation, you can use MetaGPT from the CLI

```bash
metagpt "Create a 2048 game" # this will create a repo in ./workspace
```

-or you can use it as library
+or use it as a library

```python
from metagpt.software_company import generate_repo, ProjectRepo

@@ -96,47 +107,19 @@
repo: ProjectRepo = generate_repo("Create a 2048 game") # or ProjectRepo("<path>")
-<details>
-<summary>⏬ Step 1: Download metagpt image and prepare config2.yaml :: click to expand ::</summary>
-
-```bash
-docker pull metagpt/metagpt:latest
-mkdir -p /opt/metagpt/{config,workspace}
-docker run --rm metagpt/metagpt:latest cat /app/metagpt/config/config2.yaml > /opt/metagpt/config/config2.yaml
-vim /opt/metagpt/config/config2.yaml # Change the config
-```
-
-</details>
+You can also use its [Data Interpreter](https://github.com/geekan/MetaGPT/tree/main/examples/di)
-<details>
-<summary>⏬ Step 2: Run metagpt container :: click to expand ::</summary>
-
-```bash
-docker run --name metagpt -d \
-    --privileged \
-    -v /opt/metagpt/config/config2.yaml:/app/metagpt/config/config2.yaml \
-    -v /opt/metagpt/workspace:/app/metagpt/workspace \
-    metagpt/metagpt:latest
-```
-
-</details>
-
+```python
+import asyncio
+from metagpt.roles.di.data_interpreter import DataInterpreter
-<details>
-<summary>⏬ Step 3: Use metagpt :: click to expand ::</summary>
+
+async def main():
+    di = DataInterpreter()
+    await di.run("Run data analysis on sklearn Iris dataset, include a plot")
-```bash
-docker exec -it metagpt /bin/bash
-$ metagpt "Create a 2048 game" # this will create a repo in ./workspace
+asyncio.run(main()) # or await main() in a jupyter notebook setting
```
-</details>
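`DataInterpreter.run` is a coroutine, which is why the example above drives it with `asyncio.run`. A minimal sketch, not part of this diff, of running several requirements concurrently on one event loop with `asyncio.gather`, reusing the import shown above (the requirement list is illustrative):

```python
import asyncio

from metagpt.roles.di.data_interpreter import DataInterpreter


async def run_many(requirements: list[str]) -> list:
    # One DataInterpreter per requirement; gather schedules the runs concurrently.
    return await asyncio.gather(*(DataInterpreter().run(req) for req in requirements))


if __name__ == "__main__":
    results = asyncio.run(run_many(["Run data analysis on sklearn Iris dataset, include a plot"]))
    print(results)
```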
### QuickStart & Demo Video - Try it on [MetaGPT Huggingface Space](https://huggingface.co/spaces/deepwisdom/MetaGPT) @@ -156,6 +139,7 @@ https://github.com/geekan/MetaGPT/assets/34952977/34345016-5d13-489d-b9f9-b82ace - 🧑‍💻 Contribution - [Develop Roadmap](docs/ROADMAP.md) - 🔖 Use Cases + - [Data Interpreter](https://docs.deepwisdom.ai/main/en/guide/use_cases/agent/interpreter/intro.html) - [Debate](https://docs.deepwisdom.ai/main/en/guide/use_cases/multi_agent/debate.html) - [Researcher](https://docs.deepwisdom.ai/main/en/guide/use_cases/agent/researcher.html) - [Recepit Assistant](https://docs.deepwisdom.ai/main/en/guide/use_cases/agent/receipt_assistant.html) @@ -163,10 +147,13 @@ https://github.com/geekan/MetaGPT/assets/34952977/34345016-5d13-489d-b9f9-b82ace ## Support -### Discard Join US -📢 Join Our [Discord Channel](https://discord.gg/ZRHeExS6xv)! +### Discord Join US + +📢 Join Our [Discord Channel](https://discord.gg/ZRHeExS6xv)! Looking forward to seeing you there! 🎉 -Looking forward to seeing you there! 🎉 +### Contributor form + +📝 [Fill out the form](https://airtable.com/appInfdG0eJ9J4NNL/pagK3Fh1sGclBvVkV/form) to become a contributor. We are looking forward to your participation! ### Contact Information @@ -179,7 +166,9 @@ We will respond to all questions within 2-3 business days. ## Citation -For now, cite the [arXiv paper](https://arxiv.org/abs/2308.00352): +To stay updated with the latest research and development, follow [@MetaGPT_](https://twitter.com/MetaGPT_) on Twitter. + +To cite [MetaGPT](https://arxiv.org/abs/2308.00352) or [Data Interpreter](https://arxiv.org/abs/2402.18679) in publications, please use the following BibTeX entries. ```bibtex @misc{hong2023metagpt, @@ -190,4 +179,14 @@ For now, cite the [arXiv paper](https://arxiv.org/abs/2308.00352): archivePrefix={arXiv}, primaryClass={cs.AI} } +@misc{hong2024data, + title={Data Interpreter: An LLM Agent For Data Science}, + author={Sirui Hong and Yizhang Lin and Bang Liu and Bangbang Liu and Binhao Wu and Danyang Li and Jiaqi Chen and Jiayi Zhang and Jinlin Wang and Li Zhang and Lingyao Zhang and Min Yang and Mingchen Zhuge and Taicheng Guo and Tuo Zhou and Wei Tao and Wenyi Wang and Xiangru Tang and Xiangtao Lu and Xiawu Zheng and Xinbing Liang and Yaying Fei and Yuheng Cheng and Zongze Xu and Chenglin Wu}, + year={2024}, + eprint={2402.18679}, + archivePrefix={arXiv}, + primaryClass={cs.AI} +} + ``` + diff --git a/SECURITY.md b/SECURITY.md index 623e6e5562..924ce50157 100644 --- a/SECURITY.md +++ b/SECURITY.md @@ -4,9 +4,9 @@ | Version | Supported | |---------|--------------------| - | 7.x | :x: | - | 6.x | :x: | -| < 6.x | :x: | + | 0.7.x | :x: | + | 0.6.x | :x: | +| < 0.6.x | :x: | ## Reporting a Vulnerability diff --git a/config/config2.example.yaml b/config/config2.example.yaml index 3a5cc35855..7cfd70347e 100644 --- a/config/config2.example.yaml +++ b/config/config2.example.yaml @@ -4,6 +4,7 @@ llm: api_key: "YOUR_API_KEY" model: "gpt-4-turbo-preview" # or gpt-3.5-turbo-1106 / gpt-4-1106-preview proxy: "YOUR_PROXY" # for LLM API requests + # timeout: 600 # Optional. If set to 0, default value is 300. pricing_plan: "" # Optional. If invalid, it will be automatically filled in with the value of the `model`. # Azure-exclusive pricing plan mappings: # - gpt-3.5-turbo 4k: "gpt-3.5-turbo-1106" @@ -12,6 +13,16 @@ llm: # - gpt-4 8k: "gpt-4" # See for more: https://azure.microsoft.com/en-us/pricing/details/cognitive-services/openai-service/ +# RAG Embedding. 
+# For backward compatibility, if the embedding is not set and the llm's api_type is either openai or azure, the llm's config will be used. +embedding: + api_type: "" # openai / azure / gemini / ollama etc. Check EmbeddingType for more options. + base_url: "" + api_key: "" + model: "" + api_version: "" + embed_batch_size: 100 + repair_llm_output: true # when the output is not a valid json, try to repair it proxy: "YOUR_PROXY" # for tools like requests, playwright, selenium, etc. diff --git a/config/config2.yaml b/config/config2.yaml index 8e5825b575..ba071e8040 100644 --- a/config/config2.yaml +++ b/config/config2.yaml @@ -2,6 +2,6 @@ # Reflected Code: https://github.com/geekan/MetaGPT/blob/main/metagpt/config2.py llm: api_type: "openai" # or azure / ollama / open_llm etc. Check LLMType for more options - model: "gpt-4-turbo-preview" # or gpt-3.5-turbo-1106 / gpt-4-1106-preview + model: "gpt-4-turbo" # or gpt-3.5-turbo-1106 / gpt-4-1106-preview base_url: "https://api.openai.com/v1" # or forward url / other llm url api_key: "YOUR_API_KEY" \ No newline at end of file diff --git a/docs/README_CN.md b/docs/README_CN.md index 7a0db49747..8aea5e4cb1 100644 --- a/docs/README_CN.md +++ b/docs/README_CN.md @@ -116,7 +116,7 @@ https://github.com/geekan/MetaGPT/assets/34952977/34345016-5d13-489d-b9f9-b82ace ## 引用 -引用 [arXiv paper](https://arxiv.org/abs/2308.00352): +如果您在研究论文中使用 MetaGPT 或 Data Interpreter,请引用我们的工作: ```bibtex @misc{hong2023metagpt, @@ -127,4 +127,12 @@ https://github.com/geekan/MetaGPT/assets/34952977/34345016-5d13-489d-b9f9-b82ace archivePrefix={arXiv}, primaryClass={cs.AI} } +@misc{hong2024data, + title={Data Interpreter: An LLM Agent For Data Science}, + author={Sirui Hong and Yizhang Lin and Bang Liu and Bangbang Liu and Binhao Wu and Danyang Li and Jiaqi Chen and Jiayi Zhang and Jinlin Wang and Li Zhang and Lingyao Zhang and Min Yang and Mingchen Zhuge and Taicheng Guo and Tuo Zhou and Wei Tao and Wenyi Wang and Xiangru Tang and Xiangtao Lu and Xiawu Zheng and Xinbing Liang and Yaying Fei and Yuheng Cheng and Zongze Xu and Chenglin Wu}, + year={2024}, + eprint={2402.18679}, + archivePrefix={arXiv}, + primaryClass={cs.AI} +} ``` diff --git a/docs/README_JA.md b/docs/README_JA.md index c6b99461cb..91155532b8 100644 --- a/docs/README_JA.md +++ b/docs/README_JA.md @@ -295,7 +295,7 @@ Hugging Face Space で試す ## 引用 -現時点では、[arXiv 論文](https://arxiv.org/abs/2308.00352)を引用してください: +研究論文でMetaGPTやData Interpreterを使用する場合は、以下のように当社の作業を引用してください: ```bibtex @misc{hong2023metagpt, @@ -306,6 +306,14 @@ Hugging Face Space で試す archivePrefix={arXiv}, primaryClass={cs.AI} } +@misc{hong2024data, + title={Data Interpreter: An LLM Agent For Data Science}, + author={Sirui Hong and Yizhang Lin and Bang Liu and Bangbang Liu and Binhao Wu and Danyang Li and Jiaqi Chen and Jiayi Zhang and Jinlin Wang and Li Zhang and Lingyao Zhang and Min Yang and Mingchen Zhuge and Taicheng Guo and Tuo Zhou and Wei Tao and Wenyi Wang and Xiangru Tang and Xiangtao Lu and Xiawu Zheng and Xinbing Liang and Yaying Fei and Yuheng Cheng and Zongze Xu and Chenglin Wu}, + year={2024}, + eprint={2402.18679}, + archivePrefix={arXiv}, + primaryClass={cs.AI} +} ``` ## お問い合わせ先 diff --git a/examples/android_assistant/requirements.txt b/examples/android_assistant/requirements.txt new file mode 100644 index 0000000000..155863613c --- /dev/null +++ b/examples/android_assistant/requirements.txt @@ -0,0 +1,2 @@ +pyshine==0.0.9 +opencv-python==4.6.0.66 \ No newline at end of file diff --git a/examples/android_assistant/run_assistant.py 
b/examples/android_assistant/run_assistant.py
new file mode 100644
index 0000000000..7d5d4d5c88
--- /dev/null
+++ b/examples/android_assistant/run_assistant.py
@@ -0,0 +1,71 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+# @Desc : the entry of the android assistant, covering the learning and acting stages
+# See the usage README at `metagpt/ext/android_assistant/README.md`
+
+import asyncio
+from pathlib import Path
+
+import typer
+
+from metagpt.config2 import config
+from metagpt.environment.android.android_env import AndroidEnv
+from metagpt.ext.android_assistant.roles.android_assistant import AndroidAssistant
+from metagpt.team import Team
+
+app = typer.Typer(add_completion=False, pretty_exceptions_show_locals=False)
+
+
+@app.command("", help="Run an Android Assistant")
+def startup(
+    task_desc: str = typer.Argument(help="the task description you want the android assistant to learn or act on"),
+    n_round: int = typer.Option(default=20, help="The max number of rounds for an app operation task."),
+    stage: str = typer.Option(default="learn", help="stage: learn / act"),
+    mode: str = typer.Option(default="auto", help="mode: auto / manual, used when stage=learn"),
+    app_name: str = typer.Option(default="demo", help="the name of the app you want to run"),
+    investment: float = typer.Option(default=5.0, help="Dollar amount to invest in the AI company."),
+    refine_doc: bool = typer.Option(
+        default=False, help="Refine existing operation docs based on the latest observation if True."
+    ),
+    min_dist: int = typer.Option(
+        default=30, help="The minimum distance between elements to prevent overlapping during the labeling process."
+    ),
+    android_screenshot_dir: str = typer.Option(
+        default="/sdcard/Pictures/Screenshots",
+        help="The path to store screenshots on the android device. Make sure it exists.",
+    ),
+    android_xml_dir: str = typer.Option(
+        default="/sdcard",
+        help="The path to store xml files used to determine the location of UI elements. Make sure it exists.",
+    ),
+    device_id: str = typer.Option(default="emulator-5554", help="The Android device_id"),
+):
+    config.extra = {
+        "stage": stage,
+        "mode": mode,
+        "app_name": app_name,
+        "task_desc": task_desc,
+        "refine_doc": refine_doc,
+        "min_dist": min_dist,
+        "android_screenshot_dir": android_screenshot_dir,
+        "android_xml_dir": android_xml_dir,
+        "device_id": device_id,
+    }
+
+    team = Team(
+        env=AndroidEnv(
+            device_id=device_id,
+            xml_dir=Path(android_xml_dir),
+            screenshot_dir=Path(android_screenshot_dir),
+        )
+    )
+
+    team.hire([AndroidAssistant(output_root_dir=Path(__file__).parent)])
+    team.invest(investment)
+    team.run_project(idea=task_desc)
+    asyncio.run(team.run(n_round=n_round))
+
+
+if __name__ == "__main__":
+    app()
diff --git a/examples/build_customized_agent.py b/examples/build_customized_agent.py
index cfe264b47e..7dab4833d0 100644
--- a/examples/build_customized_agent.py
+++ b/examples/build_customized_agent.py
@@ -17,7 +17,7 @@ class SimpleWriteCode(Action):
    PROMPT_TEMPLATE: str = """
-    Write a python function that can {instruction} and provide two runnnable test cases.
+    Write a python function that can {instruction} and provide two runnable test cases.
    Return ```python your_code_here ``` with NO other texts,
    your code:
    """
diff --git a/examples/data/rag/travel.txt b/examples/data/rag/travel.txt
new file mode 100644
index 0000000000..f72ad5c59e
--- /dev/null
+++ b/examples/data/rag/travel.txt
@@ -0,0 +1 @@
+Bob likes traveling.
\ No newline at end of file diff --git a/examples/data/rag/writer.txt b/examples/data/rag/writer.txt new file mode 100644 index 0000000000..1dc055901e --- /dev/null +++ b/examples/data/rag/writer.txt @@ -0,0 +1,109 @@ +Productivity +I think I am at least somewhat more productive than average, and people sometimes ask me for productivity tips. So I decided to just write them all down in one place. + +Compound growth gets discussed as a financial concept, but it works in careers as well, and it is magic. A small productivity gain, compounded over 50 years, is worth a lot. So it’s worth figuring out how to optimize productivity. If you get 10% more done and 1% better every day compared to someone else, the compounded difference is massive. + +What you work on + +Famous writers have some essential qualities, creativity and discipline + +It doesn’t matter how fast you move if it’s in a worthless direction. Picking the right thing to work on is the most important element of productivity and usually almost ignored. So think about it more! Independent thought is hard but it’s something you can get better at with practice. + +The most impressive people I know have strong beliefs about the world, which is rare in the general population. If you find yourself always agreeing with whomever you last spoke with, that’s bad. You will of course be wrong sometimes, but develop the confidence to stick with your convictions. It will let you be courageous when you’re right about something important that most people don’t see. + +I make sure to leave enough time in my schedule to think about what to work on. The best ways for me to do this are reading books, hanging out with interesting people, and spending time in nature. + +I’ve learned that I can’t be very productive working on things I don’t care about or don’t like. So I just try not to put myself in a position where I have to do them (by delegating, avoiding, or something else). Stuff that you don’t like is a painful drag on morale and momentum. + +By the way, here is an important lesson about delegation: remember that everyone else is also most productive when they’re doing what they like, and do what you’d want other people to do for you—try to figure out who likes (and is good at) doing what, and delegate that way. + +If you find yourself not liking what you’re doing for a long period of time, seriously consider a major job change. Short-term burnout happens, but if it isn’t resolved with some time off, maybe it’s time to do something you’re more interested in. + +I’ve been very fortunate to find work I like so much I’d do it for free, which makes it easy to be really productive. + +It’s important to learn that you can learn anything you want, and that you can get better quickly. This feels like an unlikely miracle the first few times it happens, but eventually you learn to trust that you can do it. + +Doing great work usually requires colleagues of some sort. Try to be around smart, productive, happy, and positive people that don’t belittle your ambitions. I love being around people who push me and inspire me to be better. To the degree you able to, avoid the opposite kind of people—the cost of letting them take up your mental cycles is horrific. + +You have to both pick the right problem and do the work. There aren’t many shortcuts. If you’re going to do something really important, you are very likely going to work both smart and hard. The biggest prizes are heavily competed for. 
This isn’t true in every field (there are great mathematicians who never spend that many hours a week working) but it is in most. + +Prioritization + +Writers have to work hard to be successful + +My system has three key pillars: “Make sure to get the important shit done”, “Don’t waste time on stupid shit”, and “make a lot of lists”. + +I highly recommend using lists. I make lists of what I want to accomplish each year, each month, and each day. Lists are very focusing, and they help me with multitasking because I don’t have to keep as much in my head. If I’m not in the mood for some particular task, I can always find something else I’m excited to do. + +I prefer lists written down on paper. It’s easy to add and remove tasks. I can access them during meetings without feeling rude. I re-transcribe lists frequently, which forces me to think about everything on the list and gives me an opportunity to add and remove items. + +I don’t bother with categorization or trying to size tasks or anything like that (the most I do is put a star next to really important items). + +I try to prioritize in a way that generates momentum. The more I get done, the better I feel, and then the more I get done. I like to start and end each day with something I can really make progress on. + +I am relentless about getting my most important projects done—I’ve found that if I really want something to happen and I push hard enough, it usually happens. + +I try to be ruthless about saying no to stuff, and doing non-critical things in the quickest way possible. I probably take this too far—for example, I am almost sure I am terse to the point of rudeness when replying to emails. + +Passion and adaptability are key qualities to writers + +I generally try to avoid meetings and conferences as I find the time cost to be huge—I get the most value out of time in my office. However, it is critical that you keep enough space in your schedule to allow for chance encounters and exposure to new people and ideas. Having an open network is valuable; though probably 90% of the random meetings I take are a waste of time, the other 10% really make up for it. + +I find most meetings are best scheduled for 15-20 minutes, or 2 hours. The default of 1 hour is usually wrong, and leads to a lot of wasted time. + +I have different times of day I try to use for different kinds of work. The first few hours of the morning are definitely my most productive time of the day, so I don’t let anyone schedule anything then. I try to do meetings in the afternoon. I take a break, or switch tasks, whenever I feel my attention starting to fade. + +I don’t think most people value their time enough—I am surprised by the number of people I know who make $100 an hour and yet will spend a couple of hours doing something they don’t want to do to save $20. + +Also, don’t fall into the trap of productivity porn—chasing productivity for its own sake isn’t helpful. Many people spend too much time thinking about how to perfectly optimize their system, and not nearly enough asking if they’re working on the right problems. It doesn’t matter what system you use or if you squeeze out every second if you’re working on the wrong thing. + +The right goal is to allocate your year optimally, not your day. + +Physical factors + +Very likely what is optimal for me won’t be optimal for you. You’ll have to experiment to find out what works best for your body. It’s definitely worth doing—it helps in all aspects of life, and you’ll feel a lot better and happier overall. 
+
+It probably took a little bit of my time every week for a few years to arrive at what works best for me, but my sense is if I do a good job at all the below I’m at least 1.5x more productive than if not.
+
+Sleep seems to be the most important physical factor in productivity for me. Some sort of sleep tracker to figure out how to sleep best is helpful. I’ve found the only things I’m consistent with are in the set-it-and-forget-it category, and I really like the Emfit QS+Active.
+
+I like a cold, dark, quiet room, and a great mattress (I resisted spending a bunch of money on a great mattress for years, which was stupid—it makes a huge difference to my sleep quality. I love this one). Not eating a lot in the few hours before sleep helps. Not drinking alcohol helps a lot, though I’m not willing to do that all the time.
+
+I use a Chili Pad to be cold while I sleep if I can’t get the room cold enough, which is great but loud (I set it up to have the cooler unit outside my room).
+
+When traveling, I use an eye mask and ear plugs.
+
+Writers usually have empathy to write good books.
+
+This is likely to be controversial, but I take a low dose of sleeping pills (like a third of a normal dose) or a very low dose of cannabis whenever I can’t sleep. I am a bad sleeper in general, and a particularly bad sleeper when I travel. It likely has tradeoffs, but so does not sleeping well. If you can already sleep well, I wouldn’t recommend this.
+
+I use a full spectrum LED light most mornings for about 10-15 minutes while I catch up on email. It’s great—if you try nothing else in here, this is the thing I’d try. It’s a ridiculous gain for me. I like this one, and it’s easy to travel with.
+
+Exercise is probably the second most important physical factor. I tried a number of different exercise programs for a few months each and the one that seemed best was lifting heavy weights 3x a week for an hour, and high intensity interval training occasionally. In addition to productivity gains, this is also the exercise program that makes me feel the best overall.
+
+The third area is nutrition. I very rarely eat breakfast, so I get about 15 hours of fasting most days (except an espresso when I wake up). I know this is contrary to most advice, and I suspect it’s not optimal for most people, but it definitely works well for me.
+
+Eating lots of sugar is the thing that makes me feel the worst and that I try hardest to avoid. I also try to avoid foods that aggravate my digestion or spike up inflammation (for example, very spicy foods). I don’t have much willpower when it comes to sweet things, so I mostly just try to keep junk food out of the house.
+
+I have one big shot of espresso immediately when I wake up and one after lunch. I assume this is about 200mg total of caffeine per day. I tried a few other configurations; this was the one that worked by far the best. I otherwise aggressively avoid stimulants, but I will have more coffee if I’m super tired and really need to get something done.
+
+If a writer wants to be super, then they should include innovative thinking.
+
+I’m vegetarian and have been since I was a kid, and I supplement methyl B-12, Omega-3, Iron, and Vitamin D-3. I got to this list with a year or so of quarterly blood tests; it’s worked for me ever since (I re-test maybe every year and a half or so). There are many doctors who will happily work with you on a super comprehensive blood test (and services like WellnessFX).
I also go out of my way to drink a lot of protein shakes, which I hate and I wouldn’t do if I weren’t vegetarian. + +Other stuff + +Here’s what I like in a workspace: natural light, quiet, knowing that I won’t be interrupted if I don’t want to be, long blocks of time, and being comfortable and relaxed (I’ve got a beautiful desk with a couple of 4k monitors on it in my office, but I spend almost all my time on my couch with my laptop). + +I wrote custom software for the annoying things I have to do frequently, which is great. I also made an effort to learn to type really fast and the keyboard shortcuts that help with my workflow. + +Like most people, I sometimes go through periods of a week or two where I just have no motivation to do anything (I suspect it may have something to do with nutrition). This sucks and always seems to happen at inconvenient times. I have not figured out what to do about it besides wait for the fog to lift, and to trust that eventually it always does. And I generally try to avoid people and situations that put me in bad moods, which is good advice whether you care about productivity or not. + +In general, I think it’s good to overcommit a little bit. I find that I generally get done what I take on, and if I have a little bit too much to do it makes me more efficient at everything, which is a way to train to avoid distractions (a great habit to build!). However, overcommitting a lot is disastrous. + +Don’t neglect your family and friends for the sake of productivity—that’s a very stupid tradeoff (and very likely a net productivity loss, because you’ll be less happy). Don’t neglect doing things you love or that clear your head either. + +Finally, to repeat one more time: productivity in the wrong direction isn’t worth anything at all. Think more about what to work on. + +Open-Mindedness and curiosity are essential to writers + diff --git a/examples/example.json b/examples/data/search_kb/example.json similarity index 100% rename from examples/example.json rename to examples/data/search_kb/example.json diff --git a/examples/example.xlsx b/examples/data/search_kb/example.xlsx similarity index 100% rename from examples/example.xlsx rename to examples/data/search_kb/example.xlsx diff --git a/examples/di/arxiv_reader.py b/examples/di/arxiv_reader.py new file mode 100644 index 0000000000..6e1939b816 --- /dev/null +++ b/examples/di/arxiv_reader.py @@ -0,0 +1,21 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +from metagpt.roles.di.data_interpreter import DataInterpreter + + +async def main(): + template = "https://arxiv.org/list/{tag}/pastweek?skip=0&show=300" + tags = ["cs.ai", "cs.cl", "cs.lg", "cs.se"] + urls = [template.format(tag=tag) for tag in tags] + prompt = f"""This is a collection of arxiv urls: '{urls}' . 
+Record each article, remove duplicates by title (they may have multiple tags), filter out papers related to
+large language model / agent / llm, print top 100 and visualize the word count of the titles"""
+    di = DataInterpreter(react_mode="react", tools=["scrape_web_playwright"])
+
+    await di.run(prompt)
+
+
+if __name__ == "__main__":
+    import asyncio
+
+    asyncio.run(main())
diff --git a/examples/di/custom_tool.py b/examples/di/custom_tool.py
new file mode 100644
index 0000000000..cbe7380c71
--- /dev/null
+++ b/examples/di/custom_tool.py
@@ -0,0 +1,36 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+"""
+@Time    : 2024/3/22 10:54
+@Author  : alexanderwu
+@File    : custom_tool.py
+"""
+
+from metagpt.roles.di.data_interpreter import DataInterpreter
+from metagpt.tools.tool_registry import register_tool
+
+
+@register_tool()
+def magic_function(arg1: str, arg2: int) -> dict:
+    """
+    The magic function that does something.
+
+    Args:
+        arg1 (str): ...
+        arg2 (int): ...
+
+    Returns:
+        dict: ...
+    """
+    return {"arg1": arg1 * 3, "arg2": arg2 * 5}
+
+
+async def main():
+    di = DataInterpreter(tools=["magic_function"])
+    await di.run("Just call the magic function with arg1 'A' and arg2 2. Tell me the result.")
+
+
+if __name__ == "__main__":
+    import asyncio
+
+    asyncio.run(main())
diff --git a/examples/di/data_visualization.py b/examples/di/data_visualization.py
index 1a21ab7cb9..184e04f266 100644
--- a/examples/di/data_visualization.py
+++ b/examples/di/data_visualization.py
@@ -1,14 +1,17 @@
import asyncio

+from metagpt.logs import logger
from metagpt.roles.di.data_interpreter import DataInterpreter
+from metagpt.utils.recovery_util import save_history


async def main(requirement: str = ""):
    di = DataInterpreter()
-    await di.run(requirement)
+    rsp = await di.run(requirement)
+    logger.info(rsp)
+    save_history(role=di)


if __name__ == "__main__":
    requirement = "Run data analysis on sklearn Iris dataset, include a plot"
-
    asyncio.run(main(requirement))
diff --git a/examples/rag_pipeline.py b/examples/rag_pipeline.py
new file mode 100644
index 0000000000..1687d556b2
--- /dev/null
+++ b/examples/rag_pipeline.py
@@ -0,0 +1,247 @@
+"""RAG pipeline"""
+
+import asyncio
+
+from pydantic import BaseModel
+
+from metagpt.const import DATA_PATH, EXAMPLE_DATA_PATH
+from metagpt.logs import logger
+from metagpt.rag.engines import SimpleEngine
+from metagpt.rag.schema import (
+    ChromaIndexConfig,
+    ChromaRetrieverConfig,
+    ElasticsearchIndexConfig,
+    ElasticsearchRetrieverConfig,
+    ElasticsearchStoreConfig,
+    FAISSRetrieverConfig,
+    LLMRankerConfig,
+)
+from metagpt.utils.exceptions import handle_exception
+
+DOC_PATH = EXAMPLE_DATA_PATH / "rag/writer.txt"
+QUESTION = "What are key qualities to be a good writer?"
+
+TRAVEL_DOC_PATH = EXAMPLE_DATA_PATH / "rag/travel.txt"
+TRAVEL_QUESTION = "What does Bob like?"
+
+LLM_TIP = "If you are not sure, just answer I don't know."
+
+
+class Player(BaseModel):
+    """To demonstrate rag add objs."""
+
+    name: str = ""
+    goal: str = "Win The 100-meter Sprint."
+    tool: str = "Red Bull Energy Drink."
+
+    def rag_key(self) -> str:
+        """For search"""
+        return self.goal
+
+
+class RAGExample:
+    """Show how to use RAG."""
+
+    def __init__(self, engine: SimpleEngine = None):
+        self._engine = engine
+
+    @property
+    def engine(self):
+        if not self._engine:
+            self._engine = SimpleEngine.from_docs(
+                input_files=[DOC_PATH],
+                retriever_configs=[FAISSRetrieverConfig()],
+                ranker_configs=[LLMRankerConfig()],
+            )
+        return self._engine
+
+    @engine.setter
+    def engine(self, value: SimpleEngine):
+        self._engine = value
+
+    async def run_pipeline(self, question=QUESTION, print_title=True):
+        """This example runs the rag pipeline with a faiss retriever and llm ranker; it will print something like:
+
+        Retrieve Result:
+        0. Productivi..., 10.0
+        1. I wrote cu..., 7.0
+        2. I highly r..., 5.0
+
+        Query Result:
+        Passion, adaptability, open-mindedness, creativity, discipline, and empathy are key qualities to be a good writer.
+        """
+        if print_title:
+            self._print_title("Run Pipeline")
+
+        nodes = await self.engine.aretrieve(question)
+        self._print_retrieve_result(nodes)
+
+        answer = await self.engine.aquery(question)
+        self._print_query_result(answer)
+
+    async def add_docs(self):
+        """This example shows how to add docs.
+
+        Before adding docs, the llm answers "I don't know".
+        After adding docs, the llm gives the correct answer; it will print something like:
+
+        [Before add docs]
+        Retrieve Result:
+
+        Query Result:
+        Empty Response
+
+        [After add docs]
+        Retrieve Result:
+        0. Bob like..., 10.0
+
+        Query Result:
+        Bob likes traveling.
+        """
+        self._print_title("Add Docs")
+
+        travel_question = f"{TRAVEL_QUESTION}{LLM_TIP}"
+        travel_filepath = TRAVEL_DOC_PATH
+
+        logger.info("[Before add docs]")
+        await self.run_pipeline(question=travel_question, print_title=False)
+
+        logger.info("[After add docs]")
+        self.engine.add_docs([travel_filepath])
+        await self.run_pipeline(question=travel_question, print_title=False)
+
+    @handle_exception
+    async def add_objects(self, print_title=True):
+        """This example shows how to add objects.
+
+        Before adding objects, the engine retrieves nothing.
+        After adding objects, the engine gives the correct answer; it will print something like:
+
+        [Before add objs]
+        Retrieve Result:
+
+        [After add objs]
+        Retrieve Result:
+        0. 100m Sprin..., 10.0
+
+        [Object Detail]
+        {'name': 'Mike', 'goal': 'Win The 100-meter Sprint', 'tool': 'Red Bull Energy Drink'}
+        """
+        if print_title:
+            self._print_title("Add Objects")
+
+        player = Player(name="Mike")
+        question = f"{player.rag_key()}"
+
+        logger.info("[Before add objs]")
+        await self._retrieve_and_print(question)
+
+        logger.info("[After add objs]")
+        self.engine.add_objs([player])
+
+        try:
+            nodes = await self._retrieve_and_print(question)
+
+            logger.info("[Object Detail]")
+            player: Player = nodes[0].metadata["obj"]
+            logger.info(player.name)
+        except Exception as e:
+            logger.error(f"nodes is empty, the llm didn't answer correctly, exception: {e}")
+
+    async def init_objects(self):
+        """This example shows how to init the engine from objs; the output is the same as add_objects."""
+        self._print_title("Init Objects")
+
+        pre_engine = self.engine
+        self.engine = SimpleEngine.from_objs(retriever_configs=[FAISSRetrieverConfig()])
+        await self.add_objects(print_title=False)
+        self.engine = pre_engine
+
+    async def init_and_query_chromadb(self):
+        """This example shows how to use chromadb and how to save and load its index; it will print something like:
+
+        Query Result:
+        Bob likes traveling.
+        """
+        self._print_title("Init And Query ChromaDB")
+
+        # 1. save index
+        output_dir = DATA_PATH / "rag"
+        SimpleEngine.from_docs(
+            input_files=[TRAVEL_DOC_PATH],
+            retriever_configs=[ChromaRetrieverConfig(persist_path=output_dir)],
+        )
+
+        # 2. load index
+        engine = SimpleEngine.from_index(index_config=ChromaIndexConfig(persist_path=output_dir))
+
+        # 3. query
+        answer = await engine.aquery(TRAVEL_QUESTION)
+        self._print_query_result(answer)
+
+    @handle_exception
+    async def init_and_query_es(self):
+        """This example shows how to use elasticsearch and how to save and load its index; it will print something like:
+
+        Query Result:
+        Bob likes traveling.
+        """
+        self._print_title("Init And Query Elasticsearch")
+
+        # 1. create es index and save docs
+        store_config = ElasticsearchStoreConfig(index_name="travel", es_url="http://127.0.0.1:9200")
+        engine = SimpleEngine.from_docs(
+            input_files=[TRAVEL_DOC_PATH],
+            retriever_configs=[ElasticsearchRetrieverConfig(store_config=store_config)],
+        )
+
+        # 2. load index
+        engine = SimpleEngine.from_index(index_config=ElasticsearchIndexConfig(store_config=store_config))
+
+        # 3. query
+        answer = await engine.aquery(TRAVEL_QUESTION)
+        self._print_query_result(answer)
+
+    @staticmethod
+    def _print_title(title):
+        logger.info(f"{'#'*30} {title} {'#'*30}")
+
+    @staticmethod
+    def _print_retrieve_result(result):
+        """Print retrieve result."""
+        logger.info("Retrieve Result:")
+
+        for i, node in enumerate(result):
+            logger.info(f"{i}. {node.text[:10]}..., {node.score}")
+
+        logger.info("")
+
+    @staticmethod
+    def _print_query_result(result):
+        """Print query result."""
+        logger.info("Query Result:")
+
+        logger.info(f"{result}\n")
+
+    async def _retrieve_and_print(self, question):
+        nodes = await self.engine.aretrieve(question)
+        self._print_retrieve_result(nodes)
+        return nodes
+
+
+async def main():
+    """RAG pipeline"""
+    e = RAGExample()
+    await e.run_pipeline()
+    await e.add_docs()
+    await e.add_objects()
+    await e.init_objects()
+    await e.init_and_query_chromadb()
+    await e.init_and_query_es()
+
+
+if __name__ == "__main__":
+    asyncio.run(main())
diff --git a/examples/rag_search.py b/examples/rag_search.py
new file mode 100644
index 0000000000..258c5ba60f
--- /dev/null
+++ b/examples/rag_search.py
@@ -0,0 +1,21 @@
+"""Agent with RAG search."""
+
+import asyncio
+
+from examples.rag_pipeline import DOC_PATH, QUESTION
+from metagpt.logs import logger
+from metagpt.rag.engines import SimpleEngine
+from metagpt.roles import Sales
+
+
+async def search():
+    """Agent with RAG search."""
+
+    store = SimpleEngine.from_docs(input_files=[DOC_PATH])
+    role = Sales(profile="Sales", store=store)
+    result = await role.run(QUESTION)
+    logger.info(result)
+
+
+if __name__ == "__main__":
+    asyncio.run(search())
diff --git a/examples/search_kb.py b/examples/search_kb.py
deleted file mode 100644
index 995720cc14..0000000000
--- a/examples/search_kb.py
+++ /dev/null
@@ -1,33 +0,0 @@
-#!/usr/bin/env python
-# -*- coding: utf-8 -*-
-"""
-@File : search_kb.py
-@Modified By: mashenquan, 2023-12-22. Delete useless codes.
-""" -import asyncio - -from langchain.embeddings import OpenAIEmbeddings - -from metagpt.config2 import config -from metagpt.const import DATA_PATH, EXAMPLE_PATH -from metagpt.document_store import FaissStore -from metagpt.logs import logger -from metagpt.roles import Sales - - -def get_store(): - llm = config.get_openai_llm() - embedding = OpenAIEmbeddings(openai_api_key=llm.api_key, openai_api_base=llm.base_url) - return FaissStore(DATA_PATH / "example.json", embedding=embedding) - - -async def search(): - store = FaissStore(EXAMPLE_PATH / "example.json") - role = Sales(profile="Sales", store=store) - query = "Which facial cleanser is good for oily skin?" - result = await role.run(query) - logger.info(result) - - -if __name__ == "__main__": - asyncio.run(search()) diff --git a/examples/search_with_specific_engine.py b/examples/search_with_specific_engine.py index 1eee762d5a..276431ed85 100644 --- a/examples/search_with_specific_engine.py +++ b/examples/search_with_specific_engine.py @@ -13,7 +13,7 @@ async def main(): question = "What are the most interesting human facts?" search = Config.default().search - kwargs = {"api_key": search.api_key, "cse_id": search.cse_id, "proxy": None} + kwargs = search.model_dump() await Searcher(search_engine=SearchEngine(engine=search.api_type, **kwargs)).run(question) diff --git a/metagpt/environment/android_env/__init__.py b/examples/stanford_town/__init__.py similarity index 100% rename from metagpt/environment/android_env/__init__.py rename to examples/stanford_town/__init__.py diff --git a/examples/stanford_town/requirements.txt b/examples/stanford_town/requirements.txt new file mode 100644 index 0000000000..e69de29bb2 diff --git a/examples/stanford_town/run_st_game.py b/examples/stanford_town/run_st_game.py new file mode 100644 index 0000000000..1a2d50f21e --- /dev/null +++ b/examples/stanford_town/run_st_game.py @@ -0,0 +1,94 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : entry of Stanford Town(ST/st) game +# README see `metagpt/ext/stanford_town/README.md` + +import asyncio +from typing import Optional + +import fire + +from metagpt.ext.stanford_town.roles.st_role import STRole +from metagpt.ext.stanford_town.stanford_town import StanfordTown +from metagpt.ext.stanford_town.utils.const import STORAGE_PATH +from metagpt.ext.stanford_town.utils.mg_ga_transform import ( + get_reverie_meta, + write_curr_sim_code, + write_curr_step, +) +from metagpt.ext.stanford_town.utils.utils import copy_folder +from metagpt.logs import logger + + +async def startup( + idea: str, fork_sim_code: str, sim_code: str, temp_storage_path: str, investment: float = 30.0, n_round: int = 500 +): + town = StanfordTown() + logger.info("StanfordTown init environment") + + # copy `storage/{fork_sim_code}` to `storage/{sim_code}` + copy_folder(str(STORAGE_PATH.joinpath(fork_sim_code)), str(STORAGE_PATH.joinpath(sim_code))) + + # get role names from `storage/{simulation_name}/reverie/meta.json` and then init roles + reverie_meta = get_reverie_meta(fork_sim_code) + roles = [] + sim_path = STORAGE_PATH.joinpath(sim_code) + sim_path.mkdir(exist_ok=True) + for idx, role_name in enumerate(reverie_meta["persona_names"]): + has_inner_voice = True if idx == 0 else False + role = STRole( + name=role_name, + profile=role_name, + sim_code=sim_code, + step=reverie_meta.get("step", 0), + start_time=reverie_meta.get("start_date"), + curr_time=reverie_meta.get("curr_time"), + sec_per_step=reverie_meta.get("sec_per_step"), + has_inner_voice=has_inner_voice, + ) + 
roles.append(role) + + # init temp_storage + write_curr_sim_code({"sim_code": sim_code}, temp_storage_path) + write_curr_step({"step": reverie_meta.get("step", 0)}, temp_storage_path) + + await town.hire(roles) + + town.invest(investment) + town.run_project(idea) + + await town.run(n_round) + + +def main( + idea: str, + fork_sim_code: str, + sim_code: str, + temp_storage_path: Optional[str] = None, + investment: float = 30.0, + n_round: int = 500, +): + """ + Args: + idea: idea works as an `inner voice` to the first agent. + fork_sim_code: old simulation name to start with, choose one inside `generative_agents/environment/frontend_server/storage/` + sim_code: new simulation name to save simulation result + temp_storage_path: generative_agents temp_storage path inside `environment/frontend_server` to interact. + investment: the investment of running agents + n_round: rounds to run agents + """ + + asyncio.run( + startup( + idea=idea, + fork_sim_code=fork_sim_code, + sim_code=sim_code, + temp_storage_path=temp_storage_path, + investment=investment, + n_round=n_round, + ) + ) + + +if __name__ == "__main__": + fire.Fire(main) diff --git a/examples/stanford_town/storage/.gitignore b/examples/stanford_town/storage/.gitignore new file mode 100644 index 0000000000..9628208614 --- /dev/null +++ b/examples/stanford_town/storage/.gitignore @@ -0,0 +1,4 @@ +# path to store simulation data +test_* +unittest* +July* \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/environment/0.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/environment/0.json new file mode 100644 index 0000000000..6eaa46c510 --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/environment/0.json @@ -0,0 +1,26 @@ +{ + "Isabella Rodriguez": { + "maze": "the_ville", + "x": 72, + "y": 14 + }, + "Klaus Mueller": { + "maze": "the_ville", + "x": 126, + "y": 46 + }, + "Maria Lopez": { + "maze": "the_ville", + "x": 123, + "y": 57 + } +} + + + + + + + + + diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/associative_memory/embeddings.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/associative_memory/embeddings.json new file mode 100644 index 0000000000..9e26dfeeb6 --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/associative_memory/embeddings.json @@ -0,0 +1 @@ +{} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/associative_memory/kw_strength.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/associative_memory/kw_strength.json new file mode 100644 index 0000000000..6dc73c1c85 --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/associative_memory/kw_strength.json @@ -0,0 +1,2 @@ +{"kw_strength_event": {}, + "kw_strength_thought": {}} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/associative_memory/nodes.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/associative_memory/nodes.json 
new file mode 100644 index 0000000000..9e26dfeeb6 --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/associative_memory/nodes.json @@ -0,0 +1 @@ +{} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/scratch.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/scratch.json new file mode 100644 index 0000000000..dbed4b705e --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/scratch.json @@ -0,0 +1,51 @@ +{ + "vision_r": 8, + "att_bandwidth": 8, + "retention": 8, + "curr_time": null, + "curr_tile": null, + "daily_plan_req": "Isabella Rodriguez opens Hobbs Cafe at 8am everyday, and works at the counter until 8pm, at which point she closes the cafe.", + "name": "Isabella Rodriguez", + "first_name": "Isabella", + "last_name": "Rodriguez", + "age": 34, + "innate": "friendly, outgoing, hospitable", + "learned": "Isabella Rodriguez is a cafe owner of Hobbs Cafe who loves to make people feel welcome. She is always looking for ways to make the cafe a place where people can come to relax and enjoy themselves.", + "currently": "Isabella Rodriguez is planning on having a Valentine's Day party at Hobbs Cafe with her customers on February 14th, 2023 at 5pm. She is gathering party material, and is telling everyone to join the party at Hobbs Cafe on February 14th, 2023, from 5pm to 7pm.", + "lifestyle": "Isabella Rodriguez goes to bed around 11pm, awakes up around 6am.", + "living_area": "the Ville:Isabella Rodriguez's apartment:main room", + "concept_forget": 100, + "daily_reflection_time": 180, + "daily_reflection_size": 5, + "overlap_reflect_th": 4, + "kw_strg_event_reflect_th": 10, + "kw_strg_thought_reflect_th": 9, + + "recency_w": 1, + "relevance_w": 1, + "importance_w": 1, + "recency_decay": 0.995, + "importance_trigger_max": 150, + "importance_trigger_curr": 150, + "importance_ele_n": 0, + "thought_count": 5, + + "daily_req": [], + "f_daily_schedule": [], + "f_daily_schedule_hourly_org": [], + "act_address": null, + "act_start_time": null, + "act_duration": null, + "act_description": null, + "act_pronunciatio": null, + "act_event": ["Isabella Rodriguez", null, null], + "act_obj_description": null, + "act_obj_pronunciatio": null, + "act_obj_event": [null, null, null], + "chatting_with": null, + "chat": null, + "chatting_with_buffer": {}, + "chatting_end_time": null, + "act_path_set": false, + "planned_path": [] +} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/spatial_memory.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/spatial_memory.json new file mode 100644 index 0000000000..f881579508 --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/spatial_memory.json @@ -0,0 +1,66 @@ +{ + "the Ville": { + "Hobbs Cafe": { + "cafe": [ + "refrigerator", + "cafe customer seating", + "cooking area", + "kitchen sink", + "behind the cafe counter", + "piano" + ] + }, + "Isabella Rodriguez's apartment": { + "main room": [ + "bed", + "desk", + "refrigerator", + "closet", + "shelf" + ] + }, + "The Rose and Crown Pub": { + "pub": [ + "shelf", 
+ "refrigerator", + "bar customer seating", + "behind the bar counter", + "kitchen sink", + "cooking area", + "microphone" + ] + }, + "Harvey Oak Supply Store": { + "supply store": [ + "supply store product shelf", + "behind the supply store counter", + "supply store counter" + ] + }, + "The Willows Market and Pharmacy": { + "store": [ + "behind the pharmacy counter", + "pharmacy store shelf", + "pharmacy store counter", + "grocery store shelf", + "behind the grocery counter", + "grocery store counter" + ] + }, + "Dorm for Oak Hill College": { + "garden": [ + "dorm garden" + ], + "common room": [ + "common room sofa", + "pool table", + "common room table" + ] + }, + "Johnson Park": { + "park": [ + "park garden" + ] + } + } +} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/associative_memory/embeddings.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/associative_memory/embeddings.json new file mode 100644 index 0000000000..9e26dfeeb6 --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/associative_memory/embeddings.json @@ -0,0 +1 @@ +{} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/associative_memory/kw_strength.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/associative_memory/kw_strength.json new file mode 100644 index 0000000000..6dc73c1c85 --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/associative_memory/kw_strength.json @@ -0,0 +1,2 @@ +{"kw_strength_event": {}, + "kw_strength_thought": {}} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/associative_memory/nodes.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/associative_memory/nodes.json new file mode 100644 index 0000000000..9e26dfeeb6 --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/associative_memory/nodes.json @@ -0,0 +1 @@ +{} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/scratch.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/scratch.json new file mode 100644 index 0000000000..7b0ce7d722 --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/scratch.json @@ -0,0 +1,51 @@ +{ + "vision_r": 8, + "att_bandwidth": 8, + "retention": 8, + "curr_time": null, + "curr_tile": null, + "daily_plan_req": "Klaus Mueller goes to the library at Oak Hill College early in the morning, spends his days writing, and eats at Hobbs Cafe.", + "name": "Klaus Mueller", + "first_name": "Klaus", + "last_name": "Mueller", + "age": 20, + "innate": "kind, inquisitive, passionate", + "learned": "Klaus Mueller is a student at Oak Hill College studying sociology. 
He is passionate about social justice and loves to explore different perspectives.", + "currently": "Klaus Mueller is writing a research paper on the effects of gentrification in low-income communities.", + "lifestyle": "Klaus Mueller goes to bed around 11pm, awakes up around 7am, eats dinner around 5pm.", + "living_area": "the Ville:Dorm for Oak Hill College:Klaus Mueller's room", + "concept_forget": 100, + "daily_reflection_time": 180, + "daily_reflection_size": 5, + "overlap_reflect_th": 4, + "kw_strg_event_reflect_th": 10, + "kw_strg_thought_reflect_th": 9, + + "recency_w": 1, + "relevance_w": 1, + "importance_w": 1, + "recency_decay": 0.99, + "importance_trigger_max": 150, + "importance_trigger_curr": 150, + "importance_ele_n": 0, + "thought_count": 5, + + "daily_req": [], + "f_daily_schedule": [], + "f_daily_schedule_hourly_org": [], + "act_address": null, + "act_start_time": null, + "act_duration": null, + "act_description": null, + "act_pronunciatio": null, + "act_event": ["Klaus Mueller", null, null], + "act_obj_description": null, + "act_obj_pronunciatio": null, + "act_obj_event": [null, null, null], + "chatting_with": null, + "chat": null, + "chatting_with_buffer": {}, + "chatting_end_time": null, + "act_path_set": false, + "planned_path": [] +} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/spatial_memory.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/spatial_memory.json new file mode 100644 index 0000000000..4f41686772 --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/spatial_memory.json @@ -0,0 +1,86 @@ +{ + "the Ville": { + "Oak Hill College": { + "hallway": [], + "library": [ + "library sofa", + "library table", + "bookshelf" + ], + "classroom": [ + "blackboard", + "classroom podium", + "classroom student seating" + ] + }, + "Dorm for Oak Hill College": { + "garden": [ + "dorm garden" + ], + "Klaus Mueller's room": [ + "bed", + "game console", + "closet", + "desk" + ], + "woman's bathroom": [ + "toilet", + "shower", + "bathroom sink" + ], + "common room": [ + "common room sofa", + "pool table", + "common room table" + ], + "man's bathroom": [ + "shower", + "bathroom sink", + "toilet" + ] + }, + "The Willows Market and Pharmacy": { + "store": [ + "grocery store shelf", + "behind the grocery counter", + "grocery store counter", + "pharmacy store shelf", + "pharmacy store counter", + "behind the pharmacy counter" + ] + }, + "Harvey Oak Supply Store": { + "supply store": [ + "supply store product shelf", + "behind the supply store counter", + "supply store counter" + ] + }, + "Johnson Park": { + "park": [ + "park garden" + ] + }, + "The Rose and Crown Pub": { + "pub": [ + "shelf", + "refrigerator", + "bar customer seating", + "behind the bar counter", + "kitchen sink", + "cooking area", + "microphone" + ] + }, + "Hobbs Cafe": { + "cafe": [ + "refrigerator", + "cafe customer seating", + "cooking area", + "kitchen sink", + "behind the cafe counter", + "piano" + ] + } + } +} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/associative_memory/embeddings.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/associative_memory/embeddings.json new file mode 100644 index 0000000000..9e26dfeeb6 
--- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/associative_memory/embeddings.json @@ -0,0 +1 @@ +{} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/associative_memory/kw_strength.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/associative_memory/kw_strength.json new file mode 100644 index 0000000000..6dc73c1c85 --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/associative_memory/kw_strength.json @@ -0,0 +1,2 @@ +{"kw_strength_event": {}, + "kw_strength_thought": {}} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/associative_memory/nodes.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/associative_memory/nodes.json new file mode 100644 index 0000000000..9e26dfeeb6 --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/associative_memory/nodes.json @@ -0,0 +1 @@ +{} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/scratch.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/scratch.json new file mode 100644 index 0000000000..c3a304952d --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/scratch.json @@ -0,0 +1,51 @@ +{ + "vision_r": 8, + "att_bandwidth": 8, + "retention": 8, + "curr_time": null, + "curr_tile": null, + "daily_plan_req": "Maria Lopez spends at least 3 hours a day Twitch streaming or gaming.", + "name": "Maria Lopez", + "first_name": "Maria", + "last_name": "Lopez", + "age": 21, + "innate": "energetic, enthusiastic, inquisitive", + "learned": "Maria Lopez is a student at Oak Hill College studying physics and a part time Twitch game streamer who loves to connect with people and explore new ideas.", + "currently": "Maria Lopez is working on her physics degree and streaming games on Twitch to make some extra money. She visits Hobbs Cafe for studying and eating just about everyday.", + "lifestyle": "Maria Lopez goes to bed around 2am, awakes up around 9am, eats dinner around 6pm. 
She likes to hang out at Hobbs Cafe if it's before 6pm.", + "living_area": "the Ville:Dorm for Oak Hill College:Maria Lopez's room", + "concept_forget": 100, + "daily_reflection_time": 180, + "daily_reflection_size": 5, + "overlap_reflect_th": 4, + "kw_strg_event_reflect_th": 10, + "kw_strg_thought_reflect_th": 9, + + "recency_w": 1, + "relevance_w": 1, + "importance_w": 1, + "recency_decay": 0.99, + "importance_trigger_max": 150, + "importance_trigger_curr": 150, + "importance_ele_n": 0, + "thought_count": 5, + + "daily_req": [], + "f_daily_schedule": [], + "f_daily_schedule_hourly_org": [], + "act_address": null, + "act_start_time": null, + "act_duration": null, + "act_description": null, + "act_pronunciatio": null, + "act_event": ["Maria Lopez", null, null], + "act_obj_description": null, + "act_obj_pronunciatio": null, + "act_obj_event": [null, null, null], + "chatting_with": null, + "chat": null, + "chatting_with_buffer": {}, + "chatting_end_time": null, + "act_path_set": false, + "planned_path": [] +} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/spatial_memory.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/spatial_memory.json new file mode 100644 index 0000000000..0a58212bda --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/spatial_memory.json @@ -0,0 +1,87 @@ +{ + "the Ville": { + "Oak Hill College": { + "hallway": [], + "library": [ + "library sofa", + "library table", + "bookshelf" + ], + "classroom": [ + "blackboard", + "classroom podium", + "classroom student seating" + ] + }, + "Dorm for Oak Hill College": { + "garden": [ + "dorm garden" + ], + "Maria Lopez's room": [ + "closet", + "desk", + "bed", + "computer", + "blackboard" + ], + "woman's bathroom": [ + "toilet", + "shower", + "bathroom sink" + ], + "common room": [ + "common room sofa", + "pool table", + "common room table" + ], + "man's bathroom": [ + "shower", + "bathroom sink", + "toilet" + ] + }, + "The Willows Market and Pharmacy": { + "store": [ + "grocery store shelf", + "behind the grocery counter", + "grocery store counter", + "pharmacy store shelf", + "pharmacy store counter", + "behind the pharmacy counter" + ] + }, + "Harvey Oak Supply Store": { + "supply store": [ + "supply store product shelf", + "behind the supply store counter", + "supply store counter" + ] + }, + "Johnson Park": { + "park": [ + "park garden" + ] + }, + "The Rose and Crown Pub": { + "pub": [ + "shelf", + "refrigerator", + "bar customer seating", + "behind the bar counter", + "kitchen sink", + "cooking area", + "microphone" + ] + }, + "Hobbs Cafe": { + "cafe": [ + "refrigerator", + "cafe customer seating", + "cooking area", + "kitchen sink", + "behind the cafe counter", + "piano" + ] + } + } +} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/reverie/meta.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/reverie/meta.json new file mode 100644 index 0000000000..1e81ec12d2 --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/reverie/meta.json @@ -0,0 +1,13 @@ +{ + "fork_sim_code": "base_the_ville_isabella_maria_klaus", + "start_date": "February 13, 2023", + "curr_time": "February 13, 2023, 00:00:00", + "sec_per_step": 10, + "maze_name": "the_ville", + "persona_names": [ + "Isabella 
Rodriguez", + "Maria Lopez", + "Klaus Mueller" + ], + "step": 0 +} \ No newline at end of file diff --git a/examples/stream_output_via_api.py b/examples/stream_output_via_api.py new file mode 100644 index 0000000000..5961f3a082 --- /dev/null +++ b/examples/stream_output_via_api.py @@ -0,0 +1,117 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +""" +@Time : 2024/3/27 9:44 +@Author : leiwu30 +@File : stream_output_via_api.py +@Description : Stream log information and communicate over the network via web api. +""" +import asyncio +import json +import socket +import threading +from contextvars import ContextVar + +from flask import Flask, Response, jsonify, request, send_from_directory + +from metagpt.const import TUTORIAL_PATH +from metagpt.logs import logger, set_llm_stream_logfunc +from metagpt.roles.tutorial_assistant import TutorialAssistant +from metagpt.utils.stream_pipe import StreamPipe + +app = Flask(__name__) + + +def stream_pipe_log(content): + print(content, end="") + stream_pipe = stream_pipe_var.get(None) + if stream_pipe: + stream_pipe.set_message(content) + + +def write_tutorial(message): + async def main(idea, stream_pipe): + stream_pipe_var.set(stream_pipe) + role = TutorialAssistant() + await role.run(idea) + + def thread_run(idea: str, stream_pipe: StreamPipe = None): + """ + Convert asynchronous function to thread function + """ + asyncio.run(main(idea, stream_pipe)) + + stream_pipe = StreamPipe() + thread = threading.Thread( + target=thread_run, + args=( + message["content"], + stream_pipe, + ), + ) + thread.start() + + while thread.is_alive(): + msg = stream_pipe.get_message() + yield stream_pipe.msg2stream(msg) + + +@app.route("/v1/chat/completions", methods=["POST"]) +def completions(): + """ + data: { + "model": "write_tutorial", + "stream": true, + "messages": [ + { + "role": "user", + "content": "Write a tutorial about MySQL" + } + ] + } + """ + + data = json.loads(request.data) + logger.info(json.dumps(data, indent=4, ensure_ascii=False)) + + # Non-streaming interfaces are not supported yet + stream_type = True if data.get("stream") else False + if not stream_type: + return jsonify({"status": 400, "msg": "Non-streaming requests are not supported, please use `stream=True`."}) + + # Only accept the last user information + # openai['model'] ~ MetaGPT['agent'] + last_message = data["messages"][-1] + model = data["model"] + + # write_tutorial + if model == "write_tutorial": + return Response(write_tutorial(last_message), mimetype="text/plain") + else: + return jsonify({"status": 400, "msg": "No suitable agent found."}) + + +@app.route("/download/") +def download_file(filename): + return send_from_directory(TUTORIAL_PATH, filename, as_attachment=True) + + +if __name__ == "__main__": + """ + curl https://$server_address:$server_port/v1/chat/completions -X POST -d '{ + "model": "write_tutorial", + "stream": true, + "messages": [ + { + "role": "user", + "content": "Write a tutorial about MySQL" + } + ] + }' + """ + server_port = 7860 + server_address = socket.gethostbyname(socket.gethostname()) + + set_llm_stream_logfunc(stream_pipe_log) + stream_pipe_var: ContextVar[StreamPipe] = ContextVar("stream_pipe") + app.run(port=server_port, host=server_address) diff --git a/examples/werewolf_game/evals/eval.py b/examples/werewolf_game/evals/eval.py new file mode 100644 index 0000000000..c890773de0 --- /dev/null +++ b/examples/werewolf_game/evals/eval.py @@ -0,0 +1,218 @@ +""" +Filename: MetaGPT/examples/werewolf_game/evals/eval.py +Created Date: Oct 18, 2023 +Updated Date: Oct 
24, 2023 +Author: [Aria](https://github.com/ariafyy) +Info: evaluate the Voting Accuracy Rate of non_werewolves and Vote Difficulty +""" + +import glob +import os +import re +from pathlib import Path + +import numpy as np +import pandas as pd +from tqdm import tqdm +from utils import Utils + +from metagpt.const import DEFAULT_WORKSPACE_ROOT, METAGPT_ROOT +from metagpt.environment.werewolf.const import RoleType + + +class Vote: + """Vote Evaluation""" + + def __init__(self): + self.OUT_PATH = DEFAULT_WORKSPACE_ROOT / "outputs" + os.makedirs(self.OUT_PATH, exist_ok=True) + self.SUB_FOLDER_LIST = ["01-10", "11-20", "21-30"] + + def _get_log_fileslist(self, IN_PATH) -> list[str]: + files_list = [] + for SUB_FOLDER in self.SUB_FOLDER_LIST: + files_list.extend(glob.glob(str(IN_PATH / SUB_FOLDER / "*.txt"))) + return files_list + + def extract_votes_from_logs(self, files_list: list): + for in_logfile in tqdm(files_list): + SUB_FOLDER = (Path(in_logfile).parent).stem + out_txtfile = self.OUT_PATH / "# {0}_{1}.txt".format(SUB_FOLDER, Path(in_logfile).stem) + Utils().pick_vote_log(in_logfile, out_txtfile) + votefiles_list = Utils().get_file_list(self.OUT_PATH) + return votefiles_list + + @staticmethod + def parse_vote_text2chunks(text: str): + """ + parse each game vote log into text chunks + + one chunk example: + ['Player1', 'Player2', 'Player3', 'Player5', 'Player6']. Say ONLY: I vote to eliminate ... + Player1(Witch): 49 | I vote to eliminate Player5 + Player2(Villager): 49 | I vote to eliminate Player5 + Player3(Villager): 49 | I vote to eliminate Player5 + Player5(Werewolf): 49 | I vote to eliminate Player6 + Player6(Seer): 49 | I vote to eliminate Player5 + """ + pattern = re.compile(r"""\[([^\]]+)\]. Say ONLY: I vote to eliminate ...""") + chunks = {} + chunk_id = 0 + last_end = 0 + for match in pattern.finditer(text): + start = match.start() + chunk = text[last_end:start] + chunks[f"vote_{chunk_id}"] = chunk.strip() + last_end = match.end() + chunk_id += 1 + final_chunk = text[last_end:].strip() + if final_chunk: + chunks[f"vote_{chunk_id}"] = final_chunk + return chunks + + def _vote_rate_players(self, text: str): + """ + # calculate the rate at which the good team votes out werewolves + :example: + + input: + ['Player1', 'Player2', 'Player3', 'Player5', 'Player6']. Say ONLY: I vote to eliminate ...
+ Player1(Witch): 49 | I vote to eliminate Player5 + Player2(Villager): 49 | I vote to eliminate Player5 + Player3(Villager): 49 | I vote to eliminate Player5 + Player5(Werewolf): 49 | I vote to eliminate Player6 + Player6(Seer): 49 | I vote to eliminate Player5 + + output: + werewolves: ['Player5'] + non_werewolves: ['Player1', 'Player2', 'Player3', 'Player6'] + as you can see: Player2(Villager) and Player3(Villager) vote to eliminate Player5(Werewolf) + :return: good team vote rate: 100.00% + """ + pattern = re.compile(r"(\w+)\(([^\)]+)\): \d+ \| I vote to eliminate (\w+)") + # find all werewolves + werewolves = [] + for match in pattern.finditer(text): + if match.group(2) == RoleType.WEREWOLF.value: + werewolves.append(match.group(1)) + + # find all non_werewolves + non_werewolves = [] + for match in pattern.finditer(text): + if match.group(2) != RoleType.WEREWOLF.value: + non_werewolves.append(match.group(1)) + num_non_werewolves = len(non_werewolves) + + # count how many players other than werewolves made the correct vote + correct_votes = 0 + for match in pattern.finditer(text): + if match.group(2) != RoleType.WEREWOLF.value and match.group(3) in werewolves: + correct_votes += 1 + + # calculate the vote accuracy rate of non_werewolves + rate = correct_votes / num_non_werewolves + good_vote_rate = round(rate, 2) + return {"good_vote_rate": good_vote_rate, "werewolves": werewolves, "non_werewolves": non_werewolves} + + def get_goodteam_vote_rate(self, text: str) -> float: + goodteam_vote_rate = self._vote_rate_players(text)["good_vote_rate"] + return goodteam_vote_rate + + def get_werewolves(self, text: str) -> list: + werewolves_list = self._vote_rate_players(text)["werewolves"] + return werewolves_list + + def get_non_werewolves(self, text: str) -> list: + non_werewolves_list = self._vote_rate_players(text)["non_werewolves"] + return non_werewolves_list + + def get_votewolf_difficulty(self, werewolves: list, non_werewolves: list) -> str: + num_living_wolfs = len(werewolves) + num_living_players = len(werewolves) + len(non_werewolves) + votewolf_difficulty = "_{0} / {1}".format(num_living_wolfs, num_living_players) + return votewolf_difficulty + + def get_result_df(self, out_txtfile: str) -> pd.DataFrame: + """ + folder: sub folders for evals + file: evaluation file, each file represents one game + votes: the number of votes, e.g.
vote_1 represents the first vote of this game, + good_vote_rate: the rate at which good players vote against werewolves, + i.e. correct_votes / the total number of players other than werewolves + total_votes: the total number of votes cast + """ + with open(out_txtfile, "r") as out_file: + text = out_file.read() + chunks = self.parse_vote_text2chunks(text) + res = [] + for k, v in chunks.items(): + if v != "": + chunks_list = list(chunks.keys()) + total_votes = len(chunks_list) - 1 + werewolves = self.get_werewolves(v) + non_werewolves = self.get_non_werewolves(v) + good_vote_rate = self.get_goodteam_vote_rate(v) + votewolf_difficulty = self.get_votewolf_difficulty(werewolves, non_werewolves) + folder = Utils().filename_to_foldername(out_txtfile) + result = { + "folder": folder, + "file": Path(out_txtfile).stem + ".txt", + "vote_round": k, + "good_vote_rate": good_vote_rate, + "total_votes": total_votes, + "votewolf_difficulty": votewolf_difficulty, + } + res.append(result) + df = pd.DataFrame(res) + return df + + def calc_avg_rate(self, IN_PATH) -> pd.DataFrame: + """ + get avg_rate for each game + avg_rate: the average good_vote_rate across all votes in the game + vote1_rate: First Round Voting Accuracy Rate + """ + infiles_list = self._get_log_fileslist(IN_PATH) + votefiles_list = self.extract_votes_from_logs(infiles_list) + df_list = [self._load_df_from_file(file) for file in votefiles_list] + combined_df = pd.concat(df_list, ignore_index=True) + # calculate the average good_vote_rate for each file + mean_rates = self._calculate_mean_rates(combined_df) + combined_df["avg_rate"] = combined_df["file"].map(mean_rates) + # calculate vote1 rate + vote1_rates = self._calc_vote1_rates(combined_df) + combined_df["vote1_rate"] = combined_df["folder"].map(vote1_rates.set_index("folder")["good_vote_rate"]) + combined_df.loc[combined_df["vote_round"] != "vote_1", "vote1_rate"] = np.nan + combined_df["vote1_rate"] = combined_df["vote1_rate"].apply(self._format_rates) + combined_df["good_vote_rate"] = combined_df["good_vote_rate"].apply(self._format_rates) + combined_df["avg_rate"] = combined_df["avg_rate"].apply(self._format_rates) + combined_df.sort_values(["file"], ascending=True, inplace=True) + return combined_df + + def _calc_vote1_rates(self, df): + df_vote1 = df[df["vote_round"] == "vote_1"] + vote1_rates = df_vote1.groupby("folder")["good_vote_rate"].mean().reset_index() + return vote1_rates + + def _load_df_from_file(self, file): + return self.get_result_df(file) + + def _calculate_mean_rates(self, df): + return df.groupby("file")["good_vote_rate"].mean() + + def _format_rates(self, s): + return Utils().float_to_percent(s) + + def get_eval_csv(self, IN_PATH, EVAL_RESULT): + """ + IN_PATH: parent folder of ["01-10", "11-20", "21-30"] + EVAL_RESULT: output csv file path + """ + combined_df = self.calc_avg_rate(IN_PATH) + combined_df.to_csv(EVAL_RESULT, index=False) + + +if __name__ == "__main__": + IN_PATH = METAGPT_ROOT / "examples/werewolf_game/evals" + EVAL_RESULT = DEFAULT_WORKSPACE_ROOT / "outputs" / "goodteam_vote_rate.csv" + Vote().get_eval_csv(IN_PATH, EVAL_RESULT) diff --git a/examples/werewolf_game/evals/utils.py b/examples/werewolf_game/evals/utils.py new file mode 100644 index 0000000000..490e7126fa --- /dev/null +++ b/examples/werewolf_game/evals/utils.py @@ -0,0 +1,134 @@ +""" +Filename: MetaGPT/examples/werewolf_game/evals/utils.py +Created Date: Oct 11, 2023 +Revised Date: Oct 20, 2023 +Author: [Aria](https://github.com/ariafyy) +""" +import glob +import os +import re +from pathlib
import Path + +from metagpt.const import METAGPT_ROOT + + +class Utils: + """Utility helpers for processing game logs""" + + @staticmethod + def polish_log(in_logfile, out_txtfile): + """polish logs for evaluation""" + pattern_text = r"(\d{4}-\d{2}-\d{2} \d{2}:\d{2}:\d{2}\.\d{3}) \| (\w+) +\| ([\w\.]+:\w+:\d+) - (.*\S)" + pattern_player = r"(Player(\d{1}): \w+)" + pattern_start = False + json_start = False + + with open(in_logfile, "r") as f, open(out_txtfile, "w") as out: + for line in f.readlines(): + matches = re.match(pattern_text, line) + if matches: + message = matches.group(4).strip() + pattern_start = True + json_start = False + + if ( + "Moderator(Moderator) ready to InstructSpeak" not in message + and "Moderator(Moderator) ready to ParseSpeak" not in message + and "Total running cost:" not in message + ): + out.write("- " + message + "\n") + else: + out.write("\n") + + elif pattern_start and not matches: + if "gpt-4 may update over time" in line: + line = "" + out.write(line) + + elif line.strip().startswith("{"): + out.write(line.strip()) + json_start = True + + elif json_start and not line.strip().endswith("}"): + out.write(line.strip()) + + elif json_start and line.strip().endswith("}"): + out.write(line.strip()) + json_start = False + + elif ( + line.startswith("(User):") or line.startswith("********** STEP:") or re.search(pattern_player, line) + ): + out.write(line) + + else: + out.write("\n") + + @staticmethod + def pick_vote_log(in_logfile, out_txtfile): + """ + pick the vote log from the log file. + `ready to AnnounceGameResult` serves as the HINT_TEXT which indicates the end of the game. + discussion based on observation and reflection is not part of the vote session. + """ + pattern_vote = r"(Player\d+)\(([A-Za-z]+)\): (\d+) \| (I vote to eliminate Player\d+)" + ignore_text = """reflection""" + HINT_TEXT = r"ready to AnnounceGameResult" + pattern_moderator = r"\[([^\]]+)\]\. Say ONLY: I vote to eliminate ..."
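+ # The patterns above drive a small state machine: a moderator line matching + # pattern_moderator opens a voting block, lines matching pattern_vote inside the + # block are written out, and a line containing ignore_text ("reflection") closes + # the block, since reflection-based discussion is not part of the vote.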
+ in_valid_block = False + + with open(in_logfile, "r") as f: + lines = f.read() + split_lines = lines.split(HINT_TEXT) + + if len(split_lines) < 2: + print(f"Key text :{HINT_TEXT} not found in {in_logfile}") + return + + relevant_lines = split_lines[1].split("\n") + with open(out_txtfile, "w") as out: + for line in relevant_lines: + if re.search(pattern_moderator, line): + in_valid_block = True + out.write(line.lstrip() + "\n") + + elif in_valid_block and re.search(pattern_vote, line): + out.write(line + "\n") + elif ignore_text in line: + in_valid_block = False + + @staticmethod + def get_file_list(path: str) -> list: + file_pattern = os.path.join(path, "*.txt") + files_list = glob.glob(file_pattern) + return files_list + + @staticmethod + def filename_to_foldername(out_txtfile: str): + """ + convert filename into its parent folder name + input:"....../# 01-10_10132100.txt" + output:# 01-10 + """ + s = Path(out_txtfile).stem + pattern_folder = r"([^_]*)_" + match = re.match(pattern_folder, s) + if match: + folder = match.group(1) + return folder + + @staticmethod + def float_to_percent(decimal: float) -> str: + """ + input: 1.00 + output: 100.00% + """ + percent = decimal * 100 + return f"{percent:.2f}%" + + +if __name__ == "__main__": + in_logfile = METAGPT_ROOT / "logs/log.txt" + out_txtfile = "input your wish path" + # Utils().polish_log(in_logfile, out_txtfile) + Utils().pick_vote_log(in_logfile, out_txtfile) diff --git a/examples/werewolf_game/start_game.py b/examples/werewolf_game/start_game.py new file mode 100644 index 0000000000..fe31c6c559 --- /dev/null +++ b/examples/werewolf_game/start_game.py @@ -0,0 +1,68 @@ +import asyncio + +import fire + +from metagpt.ext.werewolf.roles import Guard, Moderator, Seer, Villager, Werewolf, Witch +from metagpt.ext.werewolf.roles.human_player import prepare_human_player +from metagpt.ext.werewolf.werewolf_game import WerewolfGame +from metagpt.logs import logger + + +async def start_game( + investment: float = 3.0, + n_round: int = 5, + shuffle: bool = True, + add_human: bool = False, + use_reflection: bool = True, + use_experience: bool = False, + use_memory_selection: bool = False, + new_experience_version: str = "", +): + game = WerewolfGame() + game_setup, players = game.env.init_game_setup( + role_uniq_objs=[Villager, Werewolf, Guard, Seer, Witch], + num_werewolf=2, + num_villager=2, + shuffle=shuffle, + add_human=add_human, + use_reflection=use_reflection, + use_experience=use_experience, + use_memory_selection=use_memory_selection, + new_experience_version=new_experience_version, + prepare_human_player=prepare_human_player, + ) + logger.info(f"{game_setup}") + + players = [Moderator()] + players + game.hire(players) + game.invest(investment) + game.run_project(game_setup) + await game.run(n_round=n_round) + + +def main( + investment: float = 20.0, + n_round: int = 100, + shuffle: bool = True, + add_human: bool = False, + use_reflection: bool = True, + use_experience: bool = False, + use_memory_selection: bool = False, + new_experience_version: str = "", +): + asyncio.run( + start_game( + investment, + n_round, + shuffle, + add_human, + use_reflection, + use_experience, + use_memory_selection, + new_experience_version, + ) + ) + + +if __name__ == "__main__": + fire.Fire(main) diff --git a/metagpt/actions/action_node.py b/metagpt/actions/action_node.py index 09da4a9887..07638ce423 100644 --- a/metagpt/actions/action_node.py +++ b/metagpt/actions/action_node.py @@ -17,6 +17,7 @@ from tenacity import retry, stop_after_attempt, 
wait_random_exponential from metagpt.actions.action_outcls_registry import register_action_outcls +from metagpt.const import USE_CONFIG_TIMEOUT from metagpt.llm import BaseLLM from metagpt.logs import logger from metagpt.provider.postprocess.llm_output_postprocess import llm_output_postprocess @@ -330,7 +331,7 @@ def keys(self, mode: str = "auto") -> list: def compile_to(self, i: Dict, schema, kv_sep) -> str: if schema == "json": - return json.dumps(i, indent=4) + return json.dumps(i, indent=4, ensure_ascii=False) elif schema == "markdown": return dict_to_markdown(i, kv_sep=kv_sep) else: @@ -339,10 +340,7 @@ def compile_to(self, i: Dict, schema, kv_sep) -> str: def tagging(self, text, schema, tag="") -> str: if not tag: return text - if schema == "json": - return f"[{tag}]\n" + text + f"\n[/{tag}]" - else: # markdown - return f"[{tag}]\n" + text + f"\n[/{tag}]" + return f"[{tag}]\n{text}\n[/{tag}]" def _compile_f(self, schema, mode, tag, format_func, kv_sep, exclude=None) -> str: nodes = self.to_dict(format_func=format_func, mode=mode, exclude=exclude) @@ -374,7 +372,7 @@ def compile(self, context, schema="json", mode="children", template=SIMPLE_TEMPL schema="markdown": compile context, example(markdown), instruction(markdown), constraint, action """ if schema == "raw": - return context + "\n\n## Actions\n" + LANGUAGE_CONSTRAINT + "\n" + self.instruction + return f"{context}\n\n## Actions\n{LANGUAGE_CONSTRAINT}\n{self.instruction}" ### Use pydantic BaseModel directly to generate instruction and example, JSON only # child_class = self._create_children_class() @@ -416,7 +414,7 @@ async def _aask_v1( images: Optional[Union[str, list[str]]] = None, system_msgs: Optional[list[str]] = None, schema="markdown", # compatible to original format - timeout=3, + timeout=USE_CONFIG_TIMEOUT, ) -> (str, BaseModel): """Use ActionOutput to wrap the output of aask""" content = await self.llm.aask(prompt, system_msgs, images=images, timeout=timeout) @@ -448,9 +446,10 @@ def set_llm(self, llm): def set_context(self, context): self.set_recursive("context", context) - async def simple_fill(self, schema, mode, images: Optional[Union[str, list[str]]] = None, timeout=3, exclude=None): + async def simple_fill( + self, schema, mode, images: Optional[Union[str, list[str]]] = None, timeout=USE_CONFIG_TIMEOUT, exclude=None + ): prompt = self.compile(context=self.context, schema=schema, mode=mode, exclude=exclude) - if schema != "raw": mapping = self.get_mapping(mode, exclude=exclude) class_name = f"{self.key}_AN" @@ -473,7 +472,7 @@ async def fill( mode="auto", strgy="simple", images: Optional[Union[str, list[str]]] = None, - timeout=3, + timeout=USE_CONFIG_TIMEOUT, exclude=[], ): """Fill the node(s) with mode.
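Worth a note on the `timeout` changes in `action_node.py` above: the hardcoded `timeout=3` defaults become a `USE_CONFIG_TIMEOUT` sentinel (defined as `0` in `metagpt/const.py` later in this diff), so callers that pass nothing defer to the `llm.timeout` value from `config2.yaml`, with `LLM_API_TIMEOUT = 300` as the last resort. A minimal sketch of that fallback chain, using a hypothetical `resolve_timeout` helper that stands in for the provider-side logic:

```python
USE_CONFIG_TIMEOUT = 0  # sentinel: defer to llm.timeout from config2.yaml
LLM_API_TIMEOUT = 300   # last-resort default when nothing is configured


def resolve_timeout(call_timeout: int, config_timeout: int) -> int:
    """Per-call timeout wins; the falsy sentinel falls back to config, then the default."""
    return call_timeout or config_timeout or LLM_API_TIMEOUT


assert resolve_timeout(USE_CONFIG_TIMEOUT, 600) == 600  # sentinel defers to config
assert resolve_timeout(30, 600) == 30                   # explicit per-call value wins
assert resolve_timeout(USE_CONFIG_TIMEOUT, 0) == 300    # falls through to the default
```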
diff --git a/metagpt/actions/di/write_analysis_code.py b/metagpt/actions/di/write_analysis_code.py index 185926e311..711e56d39b 100644 --- a/metagpt/actions/di/write_analysis_code.py +++ b/metagpt/actions/di/write_analysis_code.py @@ -18,7 +18,7 @@ STRUCTUAL_PROMPT, ) from metagpt.schema import Message, Plan -from metagpt.utils.common import CodeParser, process_message, remove_comments +from metagpt.utils.common import CodeParser, remove_comments class WriteAnalysisCode(Action): @@ -50,7 +50,7 @@ async def run( ) working_memory = working_memory or [] - context = process_message([Message(content=structual_prompt, role="user")] + working_memory) + context = self.llm.format_msg([Message(content=structual_prompt, role="user")] + working_memory) # LLM call if use_reflection: diff --git a/metagpt/actions/rebuild_sequence_view.py b/metagpt/actions/rebuild_sequence_view.py index 0e67de9086..2aac9bf203 100644 --- a/metagpt/actions/rebuild_sequence_view.py +++ b/metagpt/actions/rebuild_sequence_view.py @@ -486,7 +486,7 @@ def parse_participant(mermaid_sequence_diagram: str) -> List[str]: Returns: List[str]: A list of participants extracted from the sequence diagram. """ - pattern = r"participant ([a-zA-Z\.0-9_]+)" + pattern = r"participant ([\w\.]+)" matches = re.findall(pattern, mermaid_sequence_diagram) matches = [re.sub(r"[\\/'\"]+", "", i) for i in matches] return matches diff --git a/metagpt/actions/research.py b/metagpt/actions/research.py index ce8d8a9677..2a99a8d99e 100644 --- a/metagpt/actions/research.py +++ b/metagpt/actions/research.py @@ -134,7 +134,7 @@ def gen_msg(): break model_name = config.llm.model - prompt = reduce_message_length(gen_msg(), model_name, system_text, 4096) + prompt = reduce_message_length(gen_msg(), model_name, system_text, config.llm.max_token) logger.debug(prompt) queries = await self._aask(prompt, [system_text]) try: diff --git a/metagpt/actions/write_code_plan_and_change_an.py b/metagpt/actions/write_code_plan_and_change_an.py index f99bffd849..a909469816 100644 --- a/metagpt/actions/write_code_plan_and_change_an.py +++ b/metagpt/actions/write_code_plan_and_change_an.py @@ -128,6 +128,9 @@ def add_numbers(): ## User New Requirements {requirement} +## Issue +{issue} + ## PRD {prd} @@ -211,7 +214,8 @@ async def run(self, *args, **kwargs): design_doc = await self.repo.docs.system_design.get(filename=self.i_context.design_filename) task_doc = await self.repo.docs.task.get(filename=self.i_context.task_filename) context = CODE_PLAN_AND_CHANGE_CONTEXT.format( - requirement=self.i_context.requirement, + requirement=f"```text\n{self.i_context.requirement}\n```", + issue=f"```text\n{self.i_context.issue}\n```", prd=prd_doc.content, design=design_doc.content, task=task_doc.content, diff --git a/metagpt/actions/write_prd_an.py b/metagpt/actions/write_prd_an.py index 5733b29da7..6a995e1840 100644 --- a/metagpt/actions/write_prd_an.py +++ b/metagpt/actions/write_prd_an.py @@ -133,10 +133,10 @@ REFINED_REQUIREMENT_ANALYSIS = ActionNode( key="Refined Requirement Analysis", expected_type=List[str], - instruction="Review and refine the existing requirement analysis to align with the evolving needs of the project " + instruction="Review and refine the existing requirement analysis into a string list to align with the evolving needs of the project " "due to incremental development. 
Ensure the analysis comprehensively covers the new features and enhancements " "required for the refined project scope.", - example=["Require add/update/modify ..."], + example=["Require add ...", "Require modify ..."], ) REQUIREMENT_POOL = ActionNode( diff --git a/metagpt/config2.py b/metagpt/config2.py index bc6af18c62..58a99c920b 100644 --- a/metagpt/config2.py +++ b/metagpt/config2.py @@ -12,6 +12,7 @@ from pydantic import BaseModel, model_validator from metagpt.configs.browser_config import BrowserConfig +from metagpt.configs.embedding_config import EmbeddingConfig from metagpt.configs.llm_config import LLMConfig, LLMType from metagpt.configs.mermaid_config import MermaidConfig from metagpt.configs.redis_config import RedisConfig @@ -47,6 +48,9 @@ class Config(CLIParams, YamlModel): # Key Parameters llm: LLMConfig + # RAG Embedding + embedding: EmbeddingConfig = EmbeddingConfig() + # Global Proxy. Will be used if llm.proxy is not set proxy: str = "" @@ -75,6 +79,7 @@ class Config(CLIParams, YamlModel): iflytek_api_key: str = "" azure_tts_subscription_key: str = "" azure_tts_region: str = "" + _extra: dict = dict() # extra config dict @classmethod def from_home(cls, path): @@ -92,7 +97,7 @@ def default(cls): """ default_config_paths: List[Path] = [ METAGPT_ROOT / "config/config2.yaml", - Path.home() / ".metagpt/config2.yaml", + CONFIG_ROOT / "config2.yaml", ] dicts = [dict(os.environ)] @@ -100,6 +105,20 @@ def default(cls): final = merge_dict(dicts) return Config(**final) + @classmethod + def from_llm_config(cls, llm_config: dict): + """user config llm + example: + llm_config = {"api_type": "xxx", "api_key": "xxx", "model": "xxx"} + gpt4 = Config.from_llm_config(llm_config) + A = Role(name="A", profile="Democratic candidate", goal="Win the election", actions=[a1], watch=[a2], config=gpt4) + """ + llm_config = LLMConfig.model_validate(llm_config) + dicts = [dict(os.environ)] + dicts += [{"llm": llm_config}] + final = merge_dict(dicts) + return Config(**final) + def update_via_cli(self, project_path, project_name, inc, reqa_file, max_auto_summarize_code): """update config via cli""" @@ -113,6 +132,14 @@ def update_via_cli(self, project_path, project_name, inc, reqa_file, max_auto_su self.reqa_file = reqa_file self.max_auto_summarize_code = max_auto_summarize_code + @property + def extra(self): + return self._extra + + @extra.setter + def extra(self, value: dict): + self._extra = value + def get_openai_llm(self) -> Optional[LLMConfig]: """Get OpenAI LLMConfig by name. If no OpenAI, raise Exception""" if self.llm.api_type == LLMType.OPENAI: diff --git a/metagpt/configs/embedding_config.py b/metagpt/configs/embedding_config.py new file mode 100644 index 0000000000..20de479996 --- /dev/null +++ b/metagpt/configs/embedding_config.py @@ -0,0 +1,50 @@ +from enum import Enum +from typing import Optional + +from pydantic import field_validator + +from metagpt.utils.yaml_model import YamlModel + + +class EmbeddingType(Enum): + OPENAI = "openai" + AZURE = "azure" + GEMINI = "gemini" + OLLAMA = "ollama" + + +class EmbeddingConfig(YamlModel): + """Config for Embedding. 
+ + Examples: + --------- + api_type: "openai" + api_key: "YOUR_API_KEY" + + api_type: "azure" + api_key: "YOUR_API_KEY" + base_url: "YOUR_BASE_URL" + api_version: "YOUR_API_VERSION" + + api_type: "gemini" + api_key: "YOUR_API_KEY" + + api_type: "ollama" + base_url: "YOUR_BASE_URL" + model: "YOUR_MODEL" + """ + + api_type: Optional[EmbeddingType] = None + api_key: Optional[str] = None + base_url: Optional[str] = None + api_version: Optional[str] = None + + model: Optional[str] = None + embed_batch_size: Optional[int] = None + + @field_validator("api_type", mode="before") + @classmethod + def check_api_type(cls, v): + if v == "": + return None + return v diff --git a/metagpt/configs/llm_config.py b/metagpt/configs/llm_config.py index 77bfc8466a..af8f56372f 100644 --- a/metagpt/configs/llm_config.py +++ b/metagpt/configs/llm_config.py @@ -10,6 +10,7 @@ from pydantic import field_validator +from metagpt.const import LLM_API_TIMEOUT from metagpt.utils.yaml_model import YamlModel @@ -29,6 +30,7 @@ class LLMType(Enum): DASHSCOPE = "dashscope" # Aliyun LingJi DashScope MOONSHOT = "moonshot" MISTRAL = "mistral" + YI = "yi" # lingyiwanwu def __missing__(self, key): return self.OPENAI @@ -73,7 +75,7 @@ class LLMConfig(YamlModel): stream: bool = False logprobs: Optional[bool] = None # https://cookbook.openai.com/examples/using_logprobs top_logprobs: Optional[int] = None - timeout: int = 60 + timeout: int = 600 # For Network proxy: Optional[str] = None @@ -87,3 +89,8 @@ def check_llm_key(cls, v): if v in ["", None, "YOUR_API_KEY"]: raise ValueError("Please set your API key in config2.yaml") return v + + @field_validator("timeout") + @classmethod + def check_timeout(cls, v): + return v or LLM_API_TIMEOUT diff --git a/metagpt/configs/mermaid_config.py b/metagpt/configs/mermaid_config.py index 50c8a18475..47f14f4cd0 100644 --- a/metagpt/configs/mermaid_config.py +++ b/metagpt/configs/mermaid_config.py @@ -13,7 +13,7 @@ class MermaidConfig(YamlModel): """Config for Mermaid""" - engine: Literal["nodejs", "ink", "playwright", "pyppeteer"] = "nodejs" + engine: Literal["nodejs", "ink", "playwright", "pyppeteer", "none"] = "nodejs" path: str = "mmdc" # mmdc puppeteer_config: str = "" pyppeteer_path: str = "/usr/bin/google-chrome-stable" diff --git a/metagpt/configs/search_config.py b/metagpt/configs/search_config.py index af928b02a1..e28b14c994 100644 --- a/metagpt/configs/search_config.py +++ b/metagpt/configs/search_config.py @@ -7,6 +7,8 @@ """ from typing import Callable, Optional +from pydantic import Field + from metagpt.tools import SearchEngineType from metagpt.utils.yaml_model import YamlModel @@ -18,3 +20,11 @@ class SearchConfig(YamlModel): api_key: str = "" cse_id: str = "" # for google search_func: Optional[Callable] = None + params: dict = Field( + default_factory=lambda: { + "engine": "google", + "google_domain": "google.com", + "gl": "us", + "hl": "en", + } + ) diff --git a/metagpt/const.py b/metagpt/const.py index a5e3ea9c2f..e4cebfd96c 100644 --- a/metagpt/const.py +++ b/metagpt/const.py @@ -49,6 +49,7 @@ def get_metagpt_root(): DEFAULT_WORKSPACE_ROOT = METAGPT_ROOT / "workspace" EXAMPLE_PATH = METAGPT_ROOT / "examples" +EXAMPLE_DATA_PATH = EXAMPLE_PATH / "data" DATA_PATH = METAGPT_ROOT / "data" TEST_DATA_PATH = METAGPT_ROOT / "tests/data" RESEARCH_PATH = DATA_PATH / "research" @@ -122,7 +123,6 @@ def get_metagpt_root(): # REDIS REDIS_KEY = "REDIS_KEY" -LLM_API_TIMEOUT = 300 # Message id IGNORED_MESSAGE_ID = "0" @@ -131,3 +131,7 @@ def get_metagpt_root(): GENERALIZATION = "Generalize" COMPOSITION =
"Composite" AGGREGATION = "Aggregate" + +# Timeout +USE_CONFIG_TIMEOUT = 0 # Using llm.timeout configuration. +LLM_API_TIMEOUT = 300 diff --git a/metagpt/context.py b/metagpt/context.py index 0add4c71ae..2bd5412026 100644 --- a/metagpt/context.py +++ b/metagpt/context.py @@ -7,7 +7,7 @@ """ import os from pathlib import Path -from typing import Any, Optional +from typing import Any, Dict, Optional from pydantic import BaseModel, ConfigDict @@ -78,12 +78,6 @@ def new_environ(self): # env.update({k: v for k, v in i.items() if isinstance(v, str)}) return env - # def use_llm(self, name: Optional[str] = None, provider: LLMType = LLMType.OPENAI) -> BaseLLM: - # """Use a LLM instance""" - # self._llm_config = self.config.get_llm_config(name, provider) - # self._llm = None - # return self._llm - def _select_costmanager(self, llm_config: LLMConfig) -> CostManager: """Return a CostManager instance""" if llm_config.api_type == LLMType.FIREWORKS: @@ -108,3 +102,38 @@ def llm_with_cost_manager_from_llm_config(self, llm_config: LLMConfig) -> BaseLL if llm.cost_manager is None: llm.cost_manager = self._select_costmanager(llm_config) return llm + + def serialize(self) -> Dict[str, Any]: + """Serialize the object's attributes into a dictionary. + + Returns: + Dict[str, Any]: A dictionary containing serialized data. + """ + return { + "workdir": str(self.repo.workdir) if self.repo else "", + "kwargs": {k: v for k, v in self.kwargs.__dict__.items()}, + "cost_manager": self.cost_manager.model_dump_json(), + } + + def deserialize(self, serialized_data: Dict[str, Any]): + """Deserialize the given serialized data and update the object's attributes accordingly. + + Args: + serialized_data (Dict[str, Any]): A dictionary containing serialized data. + """ + if not serialized_data: + return + workdir = serialized_data.get("workdir") + if workdir: + self.git_repo = GitRepository(local_path=workdir, auto_init=True) + self.repo = ProjectRepo(self.git_repo) + src_workspace = self.git_repo.workdir / self.git_repo.workdir.name + if src_workspace.exists(): + self.src_workspace = src_workspace + kwargs = serialized_data.get("kwargs") + if kwargs: + for k, v in kwargs.items(): + self.kwargs.set(k, v) + cost_manager = serialized_data.get("cost_manager") + if cost_manager: + self.cost_manager.model_validate_json(cost_manager) diff --git a/metagpt/document.py b/metagpt/document.py index 1a3c4b2f8b..4a8bb68d5c 100644 --- a/metagpt/document.py +++ b/metagpt/document.py @@ -11,12 +11,9 @@ from typing import Optional, Union import pandas as pd -from langchain.text_splitter import CharacterTextSplitter -from langchain_community.document_loaders import ( - TextLoader, - UnstructuredPDFLoader, - UnstructuredWordDocumentLoader, -) +from llama_index.core import Document, SimpleDirectoryReader +from llama_index.core.node_parser import SimpleNodeParser +from llama_index.readers.file import PDFReader from pydantic import BaseModel, ConfigDict, Field from tqdm import tqdm @@ -29,7 +26,7 @@ def validate_cols(content_col: str, df: pd.DataFrame): raise ValueError("Content column not found in DataFrame.") -def read_data(data_path: Path): +def read_data(data_path: Path) -> Union[pd.DataFrame, list[Document]]: suffix = data_path.suffix if ".xlsx" == suffix: data = pd.read_excel(data_path) @@ -38,14 +35,13 @@ def read_data(data_path: Path): elif ".json" == suffix: data = pd.read_json(data_path) elif suffix in (".docx", ".doc"): - data = UnstructuredWordDocumentLoader(str(data_path), mode="elements").load() + data = 
SimpleDirectoryReader(input_files=[str(data_path)]).load_data() elif ".txt" == suffix: - data = TextLoader(str(data_path)).load() - text_splitter = CharacterTextSplitter(separator="\n", chunk_size=256, chunk_overlap=0) - texts = text_splitter.split_documents(data) - data = texts + data = SimpleDirectoryReader(input_files=[str(data_path)]).load_data() + node_parser = SimpleNodeParser.from_defaults(separator="\n", chunk_size=256, chunk_overlap=0) + data = node_parser.get_nodes_from_documents(data) elif ".pdf" == suffix: - data = UnstructuredPDFLoader(str(data_path), mode="elements").load() + data = PDFReader.load_data(str(data_path)) else: raise NotImplementedError("File format not supported.") return data @@ -150,9 +146,9 @@ def _get_docs_and_metadatas_by_df(self) -> (list, list): metadatas.append({}) return docs, metadatas - def _get_docs_and_metadatas_by_langchain(self) -> (list, list): + def _get_docs_and_metadatas_by_llamaindex(self) -> (list, list): data = self.data - docs = [i.page_content for i in data] + docs = [i.text for i in data] metadatas = [i.metadata for i in data] return docs, metadatas @@ -160,7 +156,7 @@ def get_docs_and_metadatas(self) -> (list, list): if isinstance(self.data, pd.DataFrame): return self._get_docs_and_metadatas_by_df() elif isinstance(self.data, list): - return self._get_docs_and_metadatas_by_langchain() + return self._get_docs_and_metadatas_by_llamaindex() else: raise NotImplementedError("Data type not supported for metadata extraction.") diff --git a/metagpt/document_store/base_store.py b/metagpt/document_store/base_store.py index ddc1d626b0..6aafc57bb0 100644 --- a/metagpt/document_store/base_store.py +++ b/metagpt/document_store/base_store.py @@ -38,9 +38,9 @@ def __init__(self, raw_data_path: Path, cache_dir: Path = None): if not self.store: self.store = self.write() - def _get_index_and_store_fname(self, index_ext=".index", pkl_ext=".pkl"): - index_file = self.cache_dir / f"{self.fname}{index_ext}" - store_file = self.cache_dir / f"{self.fname}{pkl_ext}" + def _get_index_and_store_fname(self, index_ext=".json", docstore_ext=".json"): + index_file = self.cache_dir / "default__vector_store" / index_ext + store_file = self.cache_dir / "docstore" / docstore_ext return index_file, store_file @abstractmethod diff --git a/metagpt/document_store/chromadb_store.py b/metagpt/document_store/chromadb_store.py index d7344d41ba..1d3a014ee6 100644 --- a/metagpt/document_store/chromadb_store.py +++ b/metagpt/document_store/chromadb_store.py @@ -11,9 +11,9 @@ class ChromaStore: """If inherited from BaseStore, or importing other modules from metagpt, a Python exception occurs, which is strange.""" - def __init__(self, name): + def __init__(self, name: str, get_or_create: bool = False): client = chromadb.Client() - collection = client.create_collection(name) + collection = client.create_collection(name, get_or_create=get_or_create) self.client = client self.collection = collection diff --git a/metagpt/document_store/faiss_store.py b/metagpt/document_store/faiss_store.py index 2359917d5d..b196bef270 100644 --- a/metagpt/document_store/faiss_store.py +++ b/metagpt/document_store/faiss_store.py @@ -7,10 +7,14 @@ """ import asyncio from pathlib import Path -from typing import Optional +from typing import Any, Optional -from langchain.vectorstores import FAISS -from langchain_core.embeddings import Embeddings +import faiss +from llama_index.core import VectorStoreIndex, load_index_from_storage +from llama_index.core.embeddings import BaseEmbedding +from 
llama_index.core.schema import Document, QueryBundle, TextNode +from llama_index.core.storage import StorageContext +from llama_index.vector_stores.faiss import FaissVectorStore from metagpt.document import IndexableDocument from metagpt.document_store.base_store import LocalStore @@ -20,36 +24,50 @@ class FaissStore(LocalStore): def __init__( - self, raw_data: Path, cache_dir=None, meta_col="source", content_col="output", embedding: Embeddings = None + self, raw_data: Path, cache_dir=None, meta_col="source", content_col="output", embedding: BaseEmbedding = None ): self.meta_col = meta_col self.content_col = content_col self.embedding = embedding or get_embedding() + self.store: VectorStoreIndex super().__init__(raw_data, cache_dir) - def _load(self) -> Optional["FaissStore"]: - index_file, store_file = self._get_index_and_store_fname(index_ext=".faiss") # langchain FAISS using .faiss + def _load(self) -> Optional["VectorStoreIndex"]: + index_file, store_file = self._get_index_and_store_fname() if not (index_file.exists() and store_file.exists()): logger.info("Missing at least one of index_file/store_file, load failed and return None") return None + vector_store = FaissVectorStore.from_persist_dir(persist_dir=self.cache_dir) + storage_context = StorageContext.from_defaults(persist_dir=self.cache_dir, vector_store=vector_store) + index = load_index_from_storage(storage_context, embed_model=self.embedding) - return FAISS.load_local(self.raw_data_path.parent, self.embedding, self.fname) + return index - def _write(self, docs, metadatas): - store = FAISS.from_texts(docs, self.embedding, metadatas=metadatas) - return store + def _write(self, docs: list[str], metadatas: list[dict[str, Any]]) -> VectorStoreIndex: + assert len(docs) == len(metadatas) + documents = [Document(text=doc, metadata=metadatas[idx]) for idx, doc in enumerate(docs)] + + vector_store = FaissVectorStore(faiss_index=faiss.IndexFlatL2(1536)) + storage_context = StorageContext.from_defaults(vector_store=vector_store) + index = VectorStoreIndex.from_documents( + documents=documents, storage_context=storage_context, embed_model=self.embedding + ) + + return index def persist(self): - self.store.save_local(self.raw_data_path.parent, self.fname) + self.store.storage_context.persist(self.cache_dir) + + def search(self, query: str, expand_cols=False, sep="\n", *args, k=5, **kwargs): + retriever = self.store.as_retriever(similarity_top_k=k) + rsp = retriever.retrieve(QueryBundle(query_str=query, embedding=self.embedding.get_text_embedding(query))) - def search(self, query, expand_cols=False, sep="\n", *args, k=5, **kwargs): - rsp = self.store.similarity_search(query, k=k, **kwargs) logger.debug(rsp) if expand_cols: - return str(sep.join([f"{x.page_content}: {x.metadata}" for x in rsp])) + return str(sep.join([f"{x.node.text}: {x.node.metadata}" for x in rsp])) else: - return str(sep.join([f"{x.page_content}" for x in rsp])) + return str(sep.join([f"{x.node.text}" for x in rsp])) async def asearch(self, *args, **kwargs): return await asyncio.to_thread(self.search, *args, **kwargs) @@ -67,8 +85,12 @@ def write(self): def add(self, texts: list[str], *args, **kwargs) -> list[str]: """FIXME: Currently, the store is not updated after adding.""" - return self.store.add_texts(texts) + texts_embeds = self.embedding.get_text_embedding_batch(texts) + nodes = [TextNode(text=texts[idx], embedding=embed) for idx, embed in enumerate(texts_embeds)] + self.store.insert_nodes(nodes) + + return [] def delete(self, *args, **kwargs): - """Currently, 
langchain does not provide a delete interface.""" + """Currently, faiss does not provide a delete interface.""" raise NotImplementedError diff --git a/metagpt/environment/README.md b/metagpt/environment/README.md index 9476ac75ac..bb7d50d501 100644 --- a/metagpt/environment/README.md +++ b/metagpt/environment/README.md @@ -21,7 +21,7 @@ observe & step inside role's actions from metagpt.environment.api.env_api import EnvAPIAbstract # get screenshot from ExtEnv -screenshot_path: Path = env.observe( +screenshot_path: Path = await env.observe( EnvAPIAbstract( api_name="get_screenshot", kwargs={"ss_name": f"{round_count}_before", "local_save_dir": task_dir} ) @@ -34,5 +34,5 @@ res = env.step(EnvAPIAbstract("system_tap", kwargs={"x": x, "y": y})) ## TODO - add android app operation assistant under `examples/android_assistant` - migrate roles/actions of werewolf game from old version into current version -- migrate roles/actions of mincraft game from old version into current version +- migrate roles/actions of minecraft game from old version into current version - migrate roles/actions of stanford_town game from old version into current version diff --git a/metagpt/environment/__init__.py b/metagpt/environment/__init__.py index 692672fa7d..0621fff165 100644 --- a/metagpt/environment/__init__.py +++ b/metagpt/environment/__init__.py @@ -3,11 +3,10 @@ # @Desc : from metagpt.environment.base_env import Environment -from metagpt.environment.android_env.android_env import AndroidEnv -from metagpt.environment.mincraft_env.mincraft_env import MincraftExtEnv -from metagpt.environment.werewolf_env.werewolf_env import WerewolfEnv -from metagpt.environment.stanford_town_env.stanford_town_env import StanfordTownEnv -from metagpt.environment.software_env.software_env import SoftwareEnv +from metagpt.environment.android.android_env import AndroidEnv +from metagpt.environment.werewolf.werewolf_env import WerewolfEnv +from metagpt.environment.stanford_town.stanford_town_env import StanfordTownEnv +from metagpt.environment.software.software_env import SoftwareEnv -__all__ = ["AndroidEnv", "MincraftExtEnv", "WerewolfEnv", "StanfordTownEnv", "SoftwareEnv", "Environment"] +__all__ = ["AndroidEnv", "WerewolfEnv", "StanfordTownEnv", "SoftwareEnv", "Environment"] diff --git a/metagpt/environment/mincraft_env/__init__.py b/metagpt/environment/android/__init__.py similarity index 100% rename from metagpt/environment/mincraft_env/__init__.py rename to metagpt/environment/android/__init__.py diff --git a/metagpt/environment/android_env/android_env.py b/metagpt/environment/android/android_env.py similarity index 59% rename from metagpt/environment/android_env/android_env.py rename to metagpt/environment/android/android_env.py index c27e20541e..66672d219e 100644 --- a/metagpt/environment/android_env/android_env.py +++ b/metagpt/environment/android/android_env.py @@ -4,10 +4,12 @@ from pydantic import Field -from metagpt.environment.android_env.android_ext_env import AndroidExtEnv +from metagpt.environment.android.android_ext_env import AndroidExtEnv from metagpt.environment.base_env import Environment -class AndroidEnv(Environment, AndroidExtEnv): +class AndroidEnv(AndroidExtEnv, Environment): + """the inheritance order is AndroidExtEnv then Environment, so that the actual `reset` & `observe` implementations are used""" + rows: int = Field(default=0, description="rows of a grid on the screenshot") cols: int = Field(default=0, description="cols of a grid on the screenshot") diff --git a/metagpt/environment/android_env/android_ext_env.py
b/metagpt/environment/android/android_ext_env.py similarity index 66% rename from metagpt/environment/android_env/android_ext_env.py rename to metagpt/environment/android/android_ext_env.py index b81b2cd262..826846e4fb 100644 --- a/metagpt/environment/android_env/android_ext_env.py +++ b/metagpt/environment/android/android_ext_env.py @@ -8,7 +8,14 @@ from pydantic import Field -from metagpt.environment.android_env.const import ADB_EXEC_FAIL +from metagpt.environment.android.const import ADB_EXEC_FAIL +from metagpt.environment.android.env_space import ( + EnvAction, + EnvActionType, + EnvObsParams, + EnvObsType, + EnvObsValType, +) from metagpt.environment.base_env import ExtEnv, mark_as_readable, mark_as_writeable @@ -21,11 +28,70 @@ class AndroidExtEnv(ExtEnv): def __init__(self, **data: Any): super().__init__(**data) - if data.get("device_id"): + device_id = data.get("device_id") + if device_id: + devices = self.list_devices() + if device_id not in devices: + raise RuntimeError(f"device-id: {device_id} not found") (width, height) = self.device_shape self.width = data.get("width", width) self.height = data.get("height", height) + self.create_device_path(self.screenshot_dir) + self.create_device_path(self.xml_dir) + + def reset( + self, + *, + seed: Optional[int] = None, + options: Optional[dict[str, Any]] = None, + ) -> tuple[dict[str, Any], dict[str, Any]]: + super().reset(seed=seed, options=options) + + obs = self._get_obs() + + return obs, {} + + def _get_obs(self) -> dict[str, EnvObsValType]: + pass + + def observe(self, obs_params: Optional[EnvObsParams] = None) -> Any: + obs_type = obs_params.obs_type if obs_params else EnvObsType.NONE + if obs_type == EnvObsType.NONE: + pass + elif obs_type == EnvObsType.GET_SCREENSHOT: + obs = self.get_screenshot(ss_name=obs_params.ss_name, local_save_dir=obs_params.local_save_dir) + elif obs_type == EnvObsType.GET_XML: + obs = self.get_xml(xml_name=obs_params.xml_name, local_save_dir=obs_params.local_save_dir) + return obs + + def step(self, action: EnvAction) -> tuple[dict[str, Any], float, bool, bool, dict[str, Any]]: + res = self._execute_env_action(action) + + obs = {} + + ret = (obs, 1.0, False, False, {"res": res}) + return ret + + def _execute_env_action(self, action: EnvAction): + action_type = action.action_type + res = None + if action_type == EnvActionType.NONE: + pass + elif action_type == EnvActionType.SYSTEM_BACK: + res = self.system_back() + elif action_type == EnvActionType.SYSTEM_TAP: + res = self.system_tap(x=action.coord[0], y=action.coord[1]) + elif action_type == EnvActionType.USER_INPUT: + res = self.user_input(input_txt=action.input_txt) + elif action_type == EnvActionType.USER_LONGPRESS: + res = self.user_longpress(x=action.coord[0], y=action.coord[1]) + elif action_type == EnvActionType.USER_SWIPE: + res = self.user_swipe(x=action.coord[0], y=action.coord[1], orient=action.orient, dist=action.dist) + elif action_type == EnvActionType.USER_SWIPE_TO: + res = self.user_swipe_to(start=action.coord, end=action.tgt_coord) + return res + @property def adb_prefix_si(self): """adb cmd prefix with `device_id` and `shell input`""" @@ -42,12 +108,19 @@ def adb_prefix(self): return f"adb -s {self.device_id} " def execute_adb_with_cmd(self, adb_cmd: str) -> str: + adb_cmd = adb_cmd.replace("\\", "/") res = subprocess.run(adb_cmd, shell=True, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True) exec_res = ADB_EXEC_FAIL if not res.returncode: exec_res = res.stdout.strip() return exec_res + def create_device_path(self, folder_path: 
Path): + adb_cmd = f"{self.adb_prefix_shell} mkdir {folder_path} -p" + res = self.execute_adb_with_cmd(adb_cmd) + if res == ADB_EXEC_FAIL: + raise RuntimeError(f"create device path: {folder_path} failed") + @property def device_shape(self) -> tuple[int, int]: adb_cmd = f"{self.adb_prefix_shell} wm size" diff --git a/metagpt/environment/android_env/const.py b/metagpt/environment/android/const.py similarity index 100% rename from metagpt/environment/android_env/const.py rename to metagpt/environment/android/const.py diff --git a/metagpt/environment/android/env_space.py b/metagpt/environment/android/env_space.py new file mode 100644 index 0000000000..9580e3a7d3 --- /dev/null +++ b/metagpt/environment/android/env_space.py @@ -0,0 +1,92 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : + +from pathlib import Path +from typing import Union + +import numpy as np +import numpy.typing as npt +from gymnasium import spaces +from pydantic import ConfigDict, Field, field_validator + +from metagpt.environment.base_env_space import ( + BaseEnvAction, + BaseEnvActionType, + BaseEnvObsParams, + BaseEnvObsType, +) + + +class EnvActionType(BaseEnvActionType): + NONE = 0 # no action to run, just get observation + + SYSTEM_BACK = 1 + SYSTEM_TAP = 2 + USER_INPUT = 3 + USER_LONGPRESS = 4 + USER_SWIPE = 5 + USER_SWIPE_TO = 6 + + +class EnvAction(BaseEnvAction): + model_config = ConfigDict(arbitrary_types_allowed=True) + + action_type: int = Field(default=EnvActionType.NONE, description="action type") + coord: npt.NDArray[np.int64] = Field( + default_factory=lambda: np.zeros(2, dtype=np.int64), description="operation coordinate" + ) + tgt_coord: npt.NDArray[np.int64] = Field( + default_factory=lambda: np.zeros(2, dtype=np.int64), description="target operation coordinate" + ) + input_txt: str = Field(default="", description="user input text") + orient: str = Field(default="up", description="swipe orient") + dist: str = Field(default="medium", description="swipe dist") + + @field_validator("coord", "tgt_coord", mode="before") + @classmethod + def check_coord(cls, coord) -> npt.NDArray[np.int64]: + if not isinstance(coord, np.ndarray): + return np.array(coord) + return coord + + +class EnvObsType(BaseEnvObsType): + NONE = 0 # get whole observation from env + + GET_SCREENSHOT = 1 + GET_XML = 2 + + +class EnvObsParams(BaseEnvObsParams): + model_config = ConfigDict(arbitrary_types_allowed=True) + + obs_type: int = Field(default=EnvObsType.NONE, description="observation type") + ss_name: str = Field(default="", description="screenshot file name") + xml_name: str = Field(default="", description="xml file name") + local_save_dir: Union[str, Path] = Field(default="", description="local dir to save file") + + +EnvObsValType = str + + +def get_observation_space() -> spaces.Dict: + space = spaces.Dict({"screenshot": spaces.Text(256), "xml": spaces.Text(256)}) + return space + + +def get_action_space(device_shape: tuple[int, int]) -> spaces.Dict: + space = spaces.Dict( + { + "action_type": spaces.Discrete(len(EnvActionType)), + "coord": spaces.Box( + np.array([0, 0], dtype=np.int64), np.array([device_shape[0], device_shape[1]], dtype=np.int64) + ), + "tgt_coord": spaces.Box( + np.array([0, 0], dtype=np.int64), np.array([device_shape[0], device_shape[1]], dtype=np.int64) + ), + "input_txt": spaces.Text(256), + "orient": spaces.Text(16), + "dist": spaces.Text(16), + } + ) + return space diff --git a/metagpt/environment/api/env_api.py b/metagpt/environment/api/env_api.py index 1e6df544d9..924f6b1041 ---
a/metagpt/environment/api/env_api.py +++ b/metagpt/environment/api/env_api.py @@ -18,11 +18,11 @@ class EnvAPIAbstract(BaseModel): class EnvAPIRegistry(BaseModel): """the registry to store environment w&r api/interface""" - registry: dict[str, dict[str, Union[dict, Any, str]]] = Field(default=dict(), exclude=True) + registry: dict[str, Callable] = Field(default=dict(), exclude=True) def get(self, api_name: str): if api_name not in self.registry: - raise ValueError + raise KeyError(f"api_name: {api_name} not found") return self.registry.get(api_name) def __getitem__(self, api_name: str) -> Callable: diff --git a/metagpt/environment/base_env.py b/metagpt/environment/base_env.py index 0e583ffb34..024c468776 100644 --- a/metagpt/environment/base_env.py +++ b/metagpt/environment/base_env.py @@ -3,9 +3,12 @@ # @Desc : base env of executing environment import asyncio +from abc import abstractmethod from enum import Enum from typing import TYPE_CHECKING, Any, Dict, Iterable, Optional, Set, Union +from gymnasium import spaces +from gymnasium.core import ActType, ObsType from pydantic import BaseModel, ConfigDict, Field, SerializeAsAny, model_validator from metagpt.context import Context @@ -14,6 +17,7 @@ ReadAPIRegistry, WriteAPIRegistry, ) +from metagpt.environment.base_env_space import BaseEnvAction, BaseEnvObsParams from metagpt.logs import logger from metagpt.schema import Message from metagpt.utils.common import get_function_schema, is_coroutine_func, is_send_to @@ -26,7 +30,7 @@ class EnvType(Enum): ANDROID = "Android" GYM = "Gym" WEREWOLF = "Werewolf" - MINCRAFT = "Mincraft" + MINECRAFT = "Minecraft" STANFORDTOWN = "StanfordTown" @@ -47,7 +51,12 @@ def mark_as_writeable(func): class ExtEnv(BaseModel): - """External Env to intergate actual game environment""" + """External Env to integrate actual game environment""" + + model_config = ConfigDict(arbitrary_types_allowed=True) + + action_space: spaces.Space[ActType] = Field(default_factory=spaces.Space, exclude=True) + observation_space: spaces.Space[ObsType] = Field(default_factory=spaces.Space, exclude=True) def _check_api_exist(self, rw_api: Optional[str] = None): if not rw_api: @@ -61,39 +70,56 @@ def get_all_available_apis(self, mode: str = "read") -> list[Any]: else: return env_write_api_registry.get_apis() - async def observe(self, env_action: Union[str, EnvAPIAbstract]): + async def read_from_api(self, env_action: Union[str, EnvAPIAbstract]): """get observation from particular api of ExtEnv""" if isinstance(env_action, str): - read_api = env_read_api_registry.get(api_name=env_action)["func"] - self._check_api_exist(read_api) - if is_coroutine_func(read_api): - res = await read_api(self) + env_read_api = env_read_api_registry.get(api_name=env_action)["func"] + self._check_api_exist(env_read_api) + if is_coroutine_func(env_read_api): + res = await env_read_api(self) else: - res = read_api(self) + res = env_read_api(self) elif isinstance(env_action, EnvAPIAbstract): - read_api = env_read_api_registry.get(api_name=env_action.api_name)["func"] - self._check_api_exist(read_api) - if is_coroutine_func(read_api): - res = await read_api(self, *env_action.args, **env_action.kwargs) + env_read_api = env_read_api_registry.get(api_name=env_action.api_name)["func"] + self._check_api_exist(env_read_api) + if is_coroutine_func(env_read_api): + res = await env_read_api(self, *env_action.args, **env_action.kwargs) else: - res = read_api(self, *env_action.args, **env_action.kwargs) + res = env_read_api(self, *env_action.args, **env_action.kwargs) return 
res
 
-    async def step(self, env_action: Union[str, Message, EnvAPIAbstract, list[EnvAPIAbstract]]):
+    async def write_thru_api(self, env_action: Union[str, Message, EnvAPIAbstract, list[EnvAPIAbstract]]):
         """execute through particular api of ExtEnv"""
         res = None
         if isinstance(env_action, Message):
             self.publish_message(env_action)
         elif isinstance(env_action, EnvAPIAbstract):
-            write_api = env_write_api_registry.get(env_action.api_name)["func"]
-            self._check_api_exist(write_api)
-            if is_coroutine_func(write_api):
-                res = await write_api(self, *env_action.args, **env_action.kwargs)
+            env_write_api = env_write_api_registry.get(env_action.api_name)["func"]
+            self._check_api_exist(env_write_api)
+            if is_coroutine_func(env_write_api):
+                res = await env_write_api(self, *env_action.args, **env_action.kwargs)
             else:
-                res = write_api(self, *env_action.args, **env_action.kwargs)
+                res = env_write_api(self, *env_action.args, **env_action.kwargs)
 
         return res
 
+    @abstractmethod
+    def reset(
+        self,
+        *,
+        seed: Optional[int] = None,
+        options: Optional[dict[str, Any]] = None,
+    ) -> tuple[dict[str, Any], dict[str, Any]]:
+        """Implement this to get init observation"""
+
+    @abstractmethod
+    def observe(self, obs_params: Optional[BaseEnvObsParams] = None) -> Any:
+        """Implement this if you want to get partial observation from the env"""
+
+    @abstractmethod
+    def step(self, action: BaseEnvAction) -> tuple[dict[str, Any], float, bool, bool, dict[str, Any]]:
+        """Implement this to feed an action and then get new observation from the env"""
+
 
 class Environment(ExtEnv):
     """Environment, hosting a batch of roles; roles can publish messages to the environment and can be observed by other roles
@@ -108,6 +134,20 @@ class Environment(ExtEnv):
     history: str = ""  # For debug
     context: Context = Field(default_factory=Context, exclude=True)
 
+    def reset(
+        self,
+        *,
+        seed: Optional[int] = None,
+        options: Optional[dict[str, Any]] = None,
+    ) -> tuple[dict[str, Any], dict[str, Any]]:
+        pass
+
+    def observe(self, obs_params: Optional[BaseEnvObsParams] = None) -> Any:
+        pass
+
+    def step(self, action: BaseEnvAction) -> tuple[dict[str, Any], float, bool, bool, dict[str, Any]]:
+        pass
+
     @model_validator(mode="after")
     def init_roles(self):
         self.add_roles(self.roles.values())
@@ -129,8 +169,8 @@ def add_roles(self, roles: Iterable["Role"]):
             self.roles[role.profile] = role
 
         for role in roles:  # setup system message with roles
-            role.set_env(self)
             role.context = self.context
+            role.set_env(self)
 
     def publish_message(self, message: Message, peekable: bool = True) -> bool:
         """
diff --git a/metagpt/environment/base_env_space.py b/metagpt/environment/base_env_space.py
new file mode 100644
index 0000000000..fd0cfa399f
--- /dev/null
+++ b/metagpt/environment/base_env_space.py
@@ -0,0 +1,33 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+# @Desc   :
+
+from enum import IntEnum
+
+from pydantic import BaseModel, ConfigDict, Field
+
+
+class BaseEnvActionType(IntEnum):
+    # NONE = 0  # no action to run, just get observation
+    pass
+
+
+class BaseEnvAction(BaseModel):
+    """env action type and its related params of action functions/apis"""
+
+    model_config = ConfigDict(arbitrary_types_allowed=True)
+
+    action_type: int = Field(default=0, description="action type")
+
+
+class BaseEnvObsType(IntEnum):
+    # NONE = 0  # get whole observation from env
+    pass
+
+
+class BaseEnvObsParams(BaseModel):
+    """observation params for different EnvObsType to get its observe result"""
+
+    model_config = ConfigDict(arbitrary_types_allowed=True)
+
+    obs_type: int = Field(default=0, description="observation type")
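`ExtEnv` now fixes the contract every concrete environment must satisfy: `reset`, `observe`, and `step` built on the `BaseEnvAction`/`BaseEnvObsParams` types above. A toy subclass, purely illustrative (`CounterExtEnv` is not part of the codebase), shows the minimum a new environment has to implement:

```python
from typing import Any, Optional

from metagpt.environment.base_env import ExtEnv
from metagpt.environment.base_env_space import BaseEnvAction, BaseEnvObsParams


class CounterExtEnv(ExtEnv):
    count: int = 0  # toy state

    def reset(self, *, seed: Optional[int] = None, options: Optional[dict[str, Any]] = None):
        self.count = 0
        return {"count": self.count}, {}

    def observe(self, obs_params: Optional[BaseEnvObsParams] = None) -> Any:
        return {"count": self.count}

    def step(self, action: BaseEnvAction):
        self.count += action.action_type  # toy transition
        return {"count": self.count}, 1.0, False, False, {}
```

diff --git 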
a/metagpt/environment/software_env/__init__.py b/metagpt/environment/minecraft/__init__.py similarity index 100% rename from metagpt/environment/software_env/__init__.py rename to metagpt/environment/minecraft/__init__.py diff --git a/metagpt/environment/mincraft_env/const.py b/metagpt/environment/minecraft/const.py similarity index 92% rename from metagpt/environment/mincraft_env/const.py rename to metagpt/environment/minecraft/const.py index a7222f9cd4..8ac15decc8 100644 --- a/metagpt/environment/mincraft_env/const.py +++ b/metagpt/environment/minecraft/const.py @@ -4,8 +4,8 @@ from metagpt.const import METAGPT_ROOT -# For Mincraft Game Agent -MC_CKPT_DIR = METAGPT_ROOT / "data/mincraft/ckpt" +# For Minecraft Game Agent +MC_CKPT_DIR = METAGPT_ROOT / "data/minecraft/ckpt" MC_LOG_DIR = METAGPT_ROOT / "logs" MC_DEFAULT_WARMUP = { "context": 15, diff --git a/metagpt/environment/mincraft_env/mincraft_env.py b/metagpt/environment/minecraft/minecraft_env.py similarity index 93% rename from metagpt/environment/mincraft_env/mincraft_env.py rename to metagpt/environment/minecraft/minecraft_env.py index 6327aa3f4b..31a48964bb 100644 --- a/metagpt/environment/mincraft_env/mincraft_env.py +++ b/metagpt/environment/minecraft/minecraft_env.py @@ -1,6 +1,6 @@ #!/usr/bin/env python # -*- coding: utf-8 -*- -# @Desc : MG Mincraft Env +# @Desc : MG Minecraft Env # refs to `voyager voyager.py` import json @@ -8,20 +8,19 @@ import time from typing import Any, Iterable -from langchain.embeddings.openai import OpenAIEmbeddings -from langchain.vectorstores import Chroma +from llama_index.vector_stores.chroma import ChromaVectorStore from pydantic import ConfigDict, Field from metagpt.config2 import config as CONFIG from metagpt.environment.base_env import Environment -from metagpt.environment.mincraft_env.const import MC_CKPT_DIR -from metagpt.environment.mincraft_env.mincraft_ext_env import MincraftExtEnv +from metagpt.environment.minecraft.const import MC_CKPT_DIR +from metagpt.environment.minecraft.minecraft_ext_env import MinecraftExtEnv from metagpt.logs import logger from metagpt.utils.common import load_mc_skills_code, read_json_file, write_json_file -class MincraftEnv(Environment, MincraftExtEnv): - """MincraftEnv, including shared memory of cache and infomation between roles""" +class MinecraftEnv(MinecraftExtEnv, Environment): + """MinecraftEnv, including shared memory of cache and information between roles""" model_config = ConfigDict(arbitrary_types_allowed=True) @@ -48,9 +47,9 @@ class MincraftEnv(Environment, MincraftExtEnv): runtime_status: bool = False # equal to action execution status: success or failed - vectordb: Chroma = Field(default_factory=Chroma) + vectordb: ChromaVectorStore = Field(default_factory=ChromaVectorStore) - qa_cache_questions_vectordb: Chroma = Field(default_factory=Chroma) + qa_cache_questions_vectordb: ChromaVectorStore = Field(default_factory=ChromaVectorStore) @property def progress(self): @@ -73,16 +72,14 @@ def set_mc_port(self, mc_port): self.set_mc_resume() def set_mc_resume(self): - self.qa_cache_questions_vectordb = Chroma( + self.qa_cache_questions_vectordb = ChromaVectorStore( collection_name="qa_cache_questions_vectordb", - embedding_function=OpenAIEmbeddings(), - persist_directory=f"{MC_CKPT_DIR}/curriculum/vectordb", + persist_dir=f"{MC_CKPT_DIR}/curriculum/vectordb", ) - self.vectordb = Chroma( + self.vectordb = ChromaVectorStore( collection_name="skill_vectordb", - embedding_function=OpenAIEmbeddings(), - persist_directory=f"{MC_CKPT_DIR}/skill/vectordb", + 
persist_dir=f"{MC_CKPT_DIR}/skill/vectordb", ) if CONFIG.resume: @@ -285,7 +282,7 @@ def update_exploration_progress(self, success: bool): position = event["status"]["position"] blocks.append(block) positions.append(position) - new_events = self.step( + new_events = self._step( f"await givePlacedItemBack(bot, {json.dumps(blocks)}, {json.dumps(positions)})", programs=self.programs, ) @@ -326,7 +323,7 @@ async def on_event_retrieve(self, *args): Exception: If there is an issue retrieving events. """ try: - self.reset( + self._reset( options={ "mode": "soft", "wait_ticks": 20, @@ -335,13 +332,13 @@ async def on_event_retrieve(self, *args): # difficulty = "easy" if len(self.completed_tasks) > 15 else "peaceful" difficulty = "peaceful" - events = self.step("bot.chat(`/time set ${getNextTime()}`);\n" + f"bot.chat('/difficulty {difficulty}');") + events = self._step("bot.chat(`/time set ${getNextTime()}`);\n" + f"bot.chat('/difficulty {difficulty}');") self.update_event(events) return events except Exception as e: time.sleep(3) # wait for mineflayer to exit # reset bot status here - events = self.reset( + events = self._reset( options={ "mode": "hard", "wait_ticks": 20, @@ -368,7 +365,7 @@ async def on_event_execute(self, *args): Exception: If there is an issue retrieving events. """ try: - events = self.step( + events = self._step( code=self.code, programs=self.programs, ) @@ -377,7 +374,7 @@ async def on_event_execute(self, *args): except Exception as e: time.sleep(3) # wait for mineflayer to exit # reset bot status here - events = self.reset( + events = self._reset( options={ "mode": "hard", "wait_ticks": 20, diff --git a/metagpt/environment/mincraft_env/mincraft_ext_env.py b/metagpt/environment/minecraft/minecraft_ext_env.py similarity index 87% rename from metagpt/environment/mincraft_env/mincraft_ext_env.py rename to metagpt/environment/minecraft/minecraft_ext_env.py index b86250d8cd..0436bc3aa0 100644 --- a/metagpt/environment/mincraft_env/mincraft_ext_env.py +++ b/metagpt/environment/minecraft/minecraft_ext_env.py @@ -1,28 +1,29 @@ #!/usr/bin/env python # -*- coding: utf-8 -*- -# @Desc : The Mincraft external environment to integrate with Mincraft game +# @Desc : The Minecraft external environment to integrate with Minecraft game # refs to `voyager bridge.py` import json import time -from typing import Optional +from typing import Any, Optional import requests from pydantic import ConfigDict, Field, model_validator from metagpt.environment.base_env import ExtEnv, mark_as_writeable -from metagpt.environment.mincraft_env.const import ( +from metagpt.environment.base_env_space import BaseEnvAction, BaseEnvObsParams +from metagpt.environment.minecraft.const import ( MC_CKPT_DIR, MC_CORE_INVENTORY_ITEMS, MC_CURRICULUM_OB, MC_DEFAULT_WARMUP, METAGPT_ROOT, ) -from metagpt.environment.mincraft_env.process_monitor import SubprocessMonitor +from metagpt.environment.minecraft.process_monitor import SubprocessMonitor from metagpt.logs import logger -class MincraftExtEnv(ExtEnv): +class MinecraftExtEnv(ExtEnv): model_config = ConfigDict(arbitrary_types_allowed=True) mc_port: Optional[int] = Field(default=None) @@ -38,6 +39,20 @@ class MincraftExtEnv(ExtEnv): server_paused: bool = Field(default=False) warm_up: dict = Field(default=dict()) + def reset( + self, + *, + seed: Optional[int] = None, + options: Optional[dict[str, Any]] = None, + ) -> tuple[dict[str, Any], dict[str, Any]]: + pass + + def observe(self, obs_params: Optional[BaseEnvObsParams] = None) -> Any: + pass + + def step(self, action: 
BaseEnvAction) -> tuple[dict[str, Any], float, bool, bool, dict[str, Any]]: + pass + @property def server(self) -> str: return f"{self.server_host}:{self.server_port}" @@ -48,7 +63,7 @@ def _post_init_ext_env(self): self.mineflayer = SubprocessMonitor( commands=[ "node", - METAGPT_ROOT.joinpath("metagpt", "environment", "mincraft_env", "mineflayer", "index.js"), + METAGPT_ROOT.joinpath("metagpt", "environment", "minecraft", "mineflayer", "index.js"), str(self.server_port), ], name="mineflayer", @@ -115,7 +130,7 @@ def check_process(self) -> dict: return res.json() @mark_as_writeable - def reset(self, *, seed=None, options=None) -> dict: + def _reset(self, *, seed=None, options=None) -> dict: if options is None: options = {} if options.get("inventory", {}) and options.get("mode", "hard") != "hard": @@ -145,7 +160,7 @@ def reset(self, *, seed=None, options=None) -> dict: return json.loads(returned_data) @mark_as_writeable - def step(self, code: str, programs: str = "") -> dict: + def _step(self, code: str, programs: str = "") -> dict: if not self.has_reset: raise RuntimeError("Environment has not been reset yet") self.check_process() diff --git a/metagpt/environment/mincraft_env/mineflayer/.gitignore b/metagpt/environment/minecraft/mineflayer/.gitignore similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/.gitignore rename to metagpt/environment/minecraft/mineflayer/.gitignore diff --git a/metagpt/environment/mincraft_env/mineflayer/.prettierignore b/metagpt/environment/minecraft/mineflayer/.prettierignore similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/.prettierignore rename to metagpt/environment/minecraft/mineflayer/.prettierignore diff --git a/metagpt/environment/mincraft_env/mineflayer/.prettierrc.json b/metagpt/environment/minecraft/mineflayer/.prettierrc.json similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/.prettierrc.json rename to metagpt/environment/minecraft/mineflayer/.prettierrc.json diff --git a/metagpt/environment/mincraft_env/mineflayer/index.js b/metagpt/environment/minecraft/mineflayer/index.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/index.js rename to metagpt/environment/minecraft/mineflayer/index.js diff --git a/metagpt/environment/mincraft_env/mineflayer/lib/observation/base.js b/metagpt/environment/minecraft/mineflayer/lib/observation/base.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/lib/observation/base.js rename to metagpt/environment/minecraft/mineflayer/lib/observation/base.js diff --git a/metagpt/environment/mincraft_env/mineflayer/lib/observation/chests.js b/metagpt/environment/minecraft/mineflayer/lib/observation/chests.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/lib/observation/chests.js rename to metagpt/environment/minecraft/mineflayer/lib/observation/chests.js diff --git a/metagpt/environment/mincraft_env/mineflayer/lib/observation/inventory.js b/metagpt/environment/minecraft/mineflayer/lib/observation/inventory.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/lib/observation/inventory.js rename to metagpt/environment/minecraft/mineflayer/lib/observation/inventory.js diff --git a/metagpt/environment/mincraft_env/mineflayer/lib/observation/onChat.js b/metagpt/environment/minecraft/mineflayer/lib/observation/onChat.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/lib/observation/onChat.js rename to 
metagpt/environment/minecraft/mineflayer/lib/observation/onChat.js diff --git a/metagpt/environment/mincraft_env/mineflayer/lib/observation/onError.js b/metagpt/environment/minecraft/mineflayer/lib/observation/onError.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/lib/observation/onError.js rename to metagpt/environment/minecraft/mineflayer/lib/observation/onError.js diff --git a/metagpt/environment/mincraft_env/mineflayer/lib/observation/onSave.js b/metagpt/environment/minecraft/mineflayer/lib/observation/onSave.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/lib/observation/onSave.js rename to metagpt/environment/minecraft/mineflayer/lib/observation/onSave.js diff --git a/metagpt/environment/mincraft_env/mineflayer/lib/observation/status.js b/metagpt/environment/minecraft/mineflayer/lib/observation/status.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/lib/observation/status.js rename to metagpt/environment/minecraft/mineflayer/lib/observation/status.js diff --git a/metagpt/environment/mincraft_env/mineflayer/lib/observation/voxels.js b/metagpt/environment/minecraft/mineflayer/lib/observation/voxels.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/lib/observation/voxels.js rename to metagpt/environment/minecraft/mineflayer/lib/observation/voxels.js diff --git a/metagpt/environment/mincraft_env/mineflayer/lib/skillLoader.js b/metagpt/environment/minecraft/mineflayer/lib/skillLoader.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/lib/skillLoader.js rename to metagpt/environment/minecraft/mineflayer/lib/skillLoader.js diff --git a/metagpt/environment/mincraft_env/mineflayer/lib/utils.js b/metagpt/environment/minecraft/mineflayer/lib/utils.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/lib/utils.js rename to metagpt/environment/minecraft/mineflayer/lib/utils.js diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/.gitignore b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/.gitignore similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/.gitignore rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/.gitignore diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/LICENSE b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/LICENSE similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/LICENSE rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/LICENSE diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/README.md b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/README.md similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/README.md rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/README.md diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/_config.yml b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/_config.yml similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/_config.yml rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/_config.yml diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/docs/api.md 
b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/docs/api.md similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/docs/api.md rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/docs/api.md diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/examples/collector.js b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/examples/collector.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/examples/collector.js rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/examples/collector.js diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/examples/oreMiner.js b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/examples/oreMiner.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/examples/oreMiner.js rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/examples/oreMiner.js diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/examples/storageBot.js b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/examples/storageBot.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/examples/storageBot.js rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/examples/storageBot.js diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/package.json b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/package.json similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/package.json rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/package.json diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/BlockVeins.ts b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/BlockVeins.ts similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/BlockVeins.ts rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/BlockVeins.ts diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/CollectBlock.ts b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/CollectBlock.ts similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/CollectBlock.ts rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/CollectBlock.ts diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/Inventory.ts b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/Inventory.ts similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/Inventory.ts rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/Inventory.ts diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/Targets.ts b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/Targets.ts similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/Targets.ts rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/Targets.ts diff --git 
a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/TaskQueue.ts b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/TaskQueue.ts similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/TaskQueue.ts rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/TaskQueue.ts diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/TemporarySubscriber.ts b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/TemporarySubscriber.ts similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/TemporarySubscriber.ts rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/TemporarySubscriber.ts diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/Util.ts b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/Util.ts similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/Util.ts rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/Util.ts diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/index.ts b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/index.ts similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/index.ts rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/index.ts diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/tsconfig.json b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/tsconfig.json similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/tsconfig.json rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/tsconfig.json diff --git a/metagpt/environment/mincraft_env/mineflayer/package.json b/metagpt/environment/minecraft/mineflayer/package.json similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/package.json rename to metagpt/environment/minecraft/mineflayer/package.json diff --git a/metagpt/environment/mincraft_env/process_monitor.py b/metagpt/environment/minecraft/process_monitor.py similarity index 100% rename from metagpt/environment/mincraft_env/process_monitor.py rename to metagpt/environment/minecraft/process_monitor.py diff --git a/metagpt/environment/stanford_town_env/__init__.py b/metagpt/environment/software/__init__.py similarity index 100% rename from metagpt/environment/stanford_town_env/__init__.py rename to metagpt/environment/software/__init__.py diff --git a/metagpt/environment/software_env/software_env.py b/metagpt/environment/software/software_env.py similarity index 100% rename from metagpt/environment/software_env/software_env.py rename to metagpt/environment/software/software_env.py diff --git a/metagpt/environment/werewolf_env/__init__.py b/metagpt/environment/stanford_town/__init__.py similarity index 100% rename from metagpt/environment/werewolf_env/__init__.py rename to metagpt/environment/stanford_town/__init__.py diff --git a/metagpt/environment/stanford_town/env_space.py b/metagpt/environment/stanford_town/env_space.py new file mode 100644 index 0000000000..e100a29527 --- /dev/null +++ b/metagpt/environment/stanford_town/env_space.py @@ -0,0 +1,105 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : + +from typing import Any, 
Optional, Union
+
+import numpy as np
+import numpy.typing as npt
+from gymnasium import spaces
+from pydantic import ConfigDict, Field, field_validator
+
+from metagpt.environment.base_env_space import (
+    BaseEnvAction,
+    BaseEnvActionType,
+    BaseEnvObsParams,
+    BaseEnvObsType,
+)
+
+
+class EnvActionType(BaseEnvActionType):
+    NONE = 0  # no action to run, just get observation
+
+    ADD_TILE_EVENT = 1  # Add an event triple to a tile
+    RM_TILE_EVENT = 2  # Remove an event triple from a tile
+    TURN_TILE_EVENT_IDLE = 3  # Turn an event triple from a tile into idle
+    RM_TITLE_SUB_EVENT = 4  # Remove an event triple that has the input subject from a tile
+
+
+class EnvAction(BaseEnvAction):
+    """env action type and its related params of action functions/apis"""
+
+    model_config = ConfigDict(arbitrary_types_allowed=True)
+
+    action_type: int = Field(default=EnvActionType.NONE, description="action type")
+    coord: npt.NDArray[np.int64] = Field(
+        default_factory=lambda: np.zeros(2, dtype=np.int64), description="tile coordinate"
+    )
+    subject: str = Field(default="", description="subject name of first element in event")
+    event: tuple[str, Optional[str], Optional[str], Optional[str]] = Field(
+        default=("", None, None, None), description="tile event"
+    )
+
+    @field_validator("coord", mode="before")
+    @classmethod
+    def check_coord(cls, coord) -> npt.NDArray[np.int64]:
+        return coord if isinstance(coord, np.ndarray) else np.array(coord)
+
+
+class EnvObsType(BaseEnvObsType):
+    """get part observation with specific params"""
+
+    NONE = 0  # get whole observation from env
+
+    GET_TITLE = 1  # get the tile detail dictionary with given tile coord
+    TILE_PATH = 2  # get the tile address with given tile coord
+    TILE_NBR = 3  # get the neighbors of given tile coord and its vision radius
+
+
+class EnvObsParams(BaseEnvObsParams):
+    """observation params for different EnvObsType"""
+
+    model_config = ConfigDict(arbitrary_types_allowed=True)
+
+    obs_type: int = Field(default=EnvObsType.NONE, description="observation type")
+    coord: npt.NDArray[np.int64] = Field(
+        default_factory=lambda: np.zeros(2, dtype=np.int64), description="tile coordinate"
+    )
+    level: str = Field(default="", description="address level of the tile")
+    vision_radius: int = Field(default=0, description="the vision radius of current tile")
+
+    @field_validator("coord", mode="before")
+    @classmethod
+    def check_coord(cls, coord) -> npt.NDArray[np.int64]:
+        return coord if isinstance(coord, np.ndarray) else np.array(coord)
+
+
+EnvObsValType = Union[list[list[str]], dict[str, set[tuple[int, int]]], list[list[dict[str, Any]]]]
+
+
+def get_observation_space() -> spaces.Dict:
+    # placeholder spaces: the real observations are nested structures rather than plain discrete values
+    space = spaces.Dict(
+        {"collision_maze": spaces.Discrete(2), "tiles": spaces.Discrete(2), "address_tiles": spaces.Discrete(2)}
+    )
+
+    return space
+
+
+def get_action_space(maze_shape: tuple[int, int]) -> spaces.Dict:
+    """The fields defined by the space correspond to the input parameters of the action except `action_type`"""
+    space = spaces.Dict(
+        {
+            "action_type": spaces.Discrete(len(EnvActionType)),
+            "coord": spaces.Box(
+                np.array([0, 0], dtype=np.int64), np.array([maze_shape[0], maze_shape[1]], dtype=np.int64)
+            ),  # coord of the tile
+            "subject": spaces.Text(256),  # the first element of a tile event
+            "event": spaces.Tuple(
+                (spaces.Text(256), spaces.Text(256), spaces.Text(256), spaces.Text(256))
+            ),  # event is a tuple of four str
+        }
+    )
+    return space
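As a sketch of these space types in use (the coordinate and event triple below are made up for illustration), an action that stamps an event onto a tile and an observation request scoped to a tile neighbourhood look like:

```python
from metagpt.environment.stanford_town.env_space import (
    EnvAction,
    EnvActionType,
    EnvObsParams,
    EnvObsType,
)

# Hypothetical event triple: (subject, predicate, object, description).
action = EnvAction(
    action_type=EnvActionType.ADD_TILE_EVENT,
    coord=(58, 9),
    event=("double studio:common room:sofa", "is", "idle", "idle"),
)

# Ask only for a tile's neighbourhood instead of the full maze observation.
obs_params = EnvObsParams(obs_type=EnvObsType.TILE_NBR, coord=(58, 9), vision_radius=4)
```

diff --git a/metagpt/environment/stanford_town/stanford_town_env.py 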
b/metagpt/environment/stanford_town/stanford_town_env.py new file mode 100644 index 0000000000..af8a882b2d --- /dev/null +++ b/metagpt/environment/stanford_town/stanford_town_env.py @@ -0,0 +1,10 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : MG StanfordTown Env + +from metagpt.environment.base_env import Environment +from metagpt.environment.stanford_town.stanford_town_ext_env import StanfordTownExtEnv + + +class StanfordTownEnv(StanfordTownExtEnv, Environment): + pass diff --git a/metagpt/environment/stanford_town_env/stanford_town_ext_env.py b/metagpt/environment/stanford_town/stanford_town_ext_env.py similarity index 83% rename from metagpt/environment/stanford_town_env/stanford_town_ext_env.py rename to metagpt/environment/stanford_town/stanford_town_ext_env.py index 8a9a659659..30a02d4dbe 100644 --- a/metagpt/environment/stanford_town_env/stanford_town_ext_env.py +++ b/metagpt/environment/stanford_town/stanford_town_ext_env.py @@ -5,11 +5,20 @@ import math from pathlib import Path -from typing import Optional, Tuple +from typing import Any, Optional from pydantic import ConfigDict, Field, model_validator from metagpt.environment.base_env import ExtEnv, mark_as_readable, mark_as_writeable +from metagpt.environment.stanford_town.env_space import ( + EnvAction, + EnvActionType, + EnvObsParams, + EnvObsType, + EnvObsValType, + get_action_space, + get_observation_space, +) from metagpt.utils.common import read_csv_to_list, read_json_file @@ -197,15 +206,82 @@ def _init_maze(cls, values): else: address_tiles[add] = set([(j, i)]) values["address_tiles"] = address_tiles + + values["action_space"] = get_action_space((maze_width, maze_height)) + values["observation_space"] = get_observation_space() return values + def reset( + self, + *, + seed: Optional[int] = None, + options: Optional[dict[str, Any]] = None, + ) -> tuple[dict[str, EnvObsValType], dict[str, Any]]: + """reset env and get the init observation + Return results corresponding to `observation, info` + """ + super().reset(seed=seed, options=options) + + obs = self._get_obs() + + return obs, {} + + def _get_obs(self) -> dict[str, EnvObsValType]: + """Get observation""" + return { + "collision_maze": self.get_collision_maze(), + "tiles": self.tiles, + "address_tiles": self.get_address_tiles(), + } + + def observe(self, obs_params: Optional[EnvObsParams] = None) -> Any: + """Get partial or full observation from the env""" + obs_type = obs_params.obs_type if obs_params else EnvObsType.NONE + if obs_type == EnvObsType.NONE: + obs = self._get_obs() + elif obs_type == EnvObsType.GET_TITLE: + obs = self.access_tile(tile=obs_params.coord) + elif obs_type == EnvObsType.TILE_PATH: + obs = self.get_tile_path(tile=obs_params.coord, level=obs_params.level) + elif obs_type == EnvObsType.TILE_NBR: + obs = self.get_nearby_tiles(tile=obs_params.coord, vision_r=obs_params.vision_radius) + return obs + + def step(self, action: EnvAction) -> tuple[dict[str, EnvObsValType], float, bool, bool, dict[str, Any]]: + """Execute action and then return observation + Return results corresponding to `observation, reward, terminated, truncated, info` + """ + terminated = False + try: + self._execute_env_action(action) + except Exception: + terminated = True + + obs = self._get_obs() + + ret = (obs, 1.0, terminated, False, {}) + return ret + + def _execute_env_action(self, action: EnvAction): + action_type = action.action_type + if action_type == EnvActionType.NONE: + pass + elif action_type == EnvActionType.ADD_TILE_EVENT: + 
self.add_event_from_tile(curr_event=action.event, tile=action.coord)
+        elif action_type == EnvActionType.RM_TILE_EVENT:
+            self.remove_event_from_tile(curr_event=action.event, tile=action.coord)
+        elif action_type == EnvActionType.TURN_TILE_EVENT_IDLE:
+            self.turn_event_from_tile_idle(curr_event=action.event, tile=action.coord)
+        elif action_type == EnvActionType.RM_TITLE_SUB_EVENT:
+            self.remove_subject_events_from_tile(subject=action.subject, tile=action.coord)
+
     def turn_coordinate_to_tile(self, px_coordinate: tuple[int, int]) -> tuple[int, int]:
         """
         Turns a pixel coordinate to a tile coordinate.
         """
         x = math.ceil(px_coordinate[0] / self.sq_tile_size)
         y = math.ceil(px_coordinate[1] / self.sq_tile_size)
-        return (x, y)
+        return x, y
 
     @mark_as_readable
     def get_collision_maze(self) -> list:
@@ -316,10 +392,6 @@ def get_nearby_tiles(self, tile: tuple[int, int], vision_r: int) -> list[tuple[i
                 nearby_tiles += [(i, j)]
         return nearby_tiles
 
-    @mark_as_writeable
-    def add_tiles_event(self, pt_y: int, pt_x: int, event: Tuple[str, str, str, str]):
-        self.tiles[pt_y][pt_x]["events"].add(event)
-
     @mark_as_writeable
     def add_event_from_tile(self, curr_event: tuple[str], tile: tuple[int, int]) -> None:
         """
diff --git a/metagpt/environment/stanford_town_env/stanford_town_env.py b/metagpt/environment/stanford_town_env/stanford_town_env.py
deleted file mode 100644
index 8721d6cd18..0000000000
--- a/metagpt/environment/stanford_town_env/stanford_town_env.py
+++ /dev/null
@@ -1,12 +0,0 @@
-#!/usr/bin/env python
-# -*- coding: utf-8 -*-
-# @Desc   : MG StanfordTown Env
-
-from metagpt.environment.base_env import Environment
-from metagpt.environment.stanford_town_env.stanford_town_ext_env import (
-    StanfordTownExtEnv,
-)
-
-
-class StanfordTownEnv(Environment, StanfordTownExtEnv):
-    pass
diff --git a/tests/metagpt/environment/mincraft_env/__init__.py b/metagpt/environment/werewolf/__init__.py
similarity index 100%
rename from tests/metagpt/environment/mincraft_env/__init__.py
rename to metagpt/environment/werewolf/__init__.py
diff --git a/metagpt/environment/werewolf/const.py b/metagpt/environment/werewolf/const.py
new file mode 100644
index 0000000000..7f810389da
--- /dev/null
+++ b/metagpt/environment/werewolf/const.py
@@ -0,0 +1,121 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+# @Desc   :
+
+from enum import Enum
+
+from metagpt.const import MESSAGE_ROUTE_TO_ALL
+
+
+class RoleType(Enum):
+    VILLAGER = "Villager"
+    WEREWOLF = "Werewolf"
+    GUARD = "Guard"
+    SEER = "Seer"
+    WITCH = "Witch"
+    MODERATOR = "Moderator"
+
+
+class RoleState(Enum):
+    ALIVE = "alive"  # the role is alive
+    DEAD = "dead"  # killed or poisoned
+    KILLED = "killed"  # killed by werewolf or voting
+    POISONED = "poisoned"  # killed by poison
+    SAVED = "saved"  # saved by antidote
+    PROTECTED = "protected"  # protected by guard
+
+
+class RoleActionRes(Enum):
+    SAVE = "save"
+    PASS = "pass"  # ignore current action output
+
+
+empty_set = set()
+
+# the ordered rules by the moderator to announce to everyone each step
+STEP_INSTRUCTIONS = {
+    0: {
+        "content": "It’s dark, everyone close your eyes. I will talk with you/your team secretly at night.",
+        "send_to": {RoleType.MODERATOR.value},  # for moderator to continue speaking
+        "restricted_to": empty_set,
+    },
+    1: {
+        "content": "Guard, please open your eyes!",
+        "send_to": {RoleType.MODERATOR.value},  # for moderator to continue speaking
+        "restricted_to": empty_set,
+    },
+    2: {
+        "content": """Guard, now tell me who you protect tonight? 
+You only choose one from the following living options please: {living_players}.
+Or you can pass. For example: Protect ...""",
+        "send_to": {RoleType.GUARD.value},
+        "restricted_to": {RoleType.MODERATOR.value, RoleType.GUARD.value},
+    },
+    3: {"content": "Guard, close your eyes", "send_to": {RoleType.MODERATOR.value}, "restricted_to": empty_set},
+    4: {
+        "content": "Werewolves, please open your eyes!",
+        "send_to": {RoleType.MODERATOR.value},
+        "restricted_to": empty_set,
+    },
+    5: {
+        "content": """Werewolves, I secretly tell you that {werewolf_players} are
+all of the {werewolf_num} werewolves! Keep in mind you are teammates. The remaining players are not werewolves.
+Choose one from the following living options please:
+{living_players}. For example: Kill ...""",
+        "send_to": {RoleType.WEREWOLF.value},
+        "restricted_to": {RoleType.MODERATOR.value, RoleType.WEREWOLF.value},
+    },
+    6: {"content": "Werewolves, close your eyes", "send_to": {RoleType.MODERATOR.value}, "restricted_to": empty_set},
+    7: {"content": "Witch, please open your eyes!", "send_to": {RoleType.MODERATOR.value}, "restricted_to": empty_set},
+    8: {
+        "content": """Witch, tonight {player_hunted} has been killed by the werewolves.
+You have a bottle of antidote, would you like to save him/her? If so, say "Save", else, say "Pass".""",
+        "send_to": {RoleType.WITCH.value},
+        "restricted_to": {RoleType.MODERATOR.value, RoleType.WITCH.value},
+    },  # first check whether the witch still has the antidote, then ask whether she wants to use it to save the hunted player
+    9: {
+        "content": """Witch, you also have a bottle of poison, would you like to use it to kill one of the living players?
+Choose one from the following living options: {living_players}.
+If so, say ONLY "Poison PlayerX", replace PlayerX with the actual player name, else, say "Pass".""",
+        "send_to": {RoleType.WITCH.value},
+        "restricted_to": {RoleType.MODERATOR.value, RoleType.WITCH.value},
+    },
+    10: {"content": "Witch, close your eyes", "send_to": {RoleType.MODERATOR.value}, "restricted_to": empty_set},
+    11: {"content": "Seer, please open your eyes!", "send_to": {RoleType.MODERATOR.value}, "restricted_to": empty_set},
+    12: {
+        "content": """Seer, you can check one player's identity. Whose identity are you going to verify tonight?
+Choose only one from the following living options:{living_players}.""",
+        "send_to": {RoleType.SEER.value},
+        "restricted_to": {RoleType.MODERATOR.value, RoleType.SEER.value},
+    },
+    13: {"content": "Seer, close your eyes", "send_to": {RoleType.MODERATOR.value}, "restricted_to": empty_set},
+    # The 1-st daytime
+    14: {
+        "content": """It's daytime. Everyone woke up except those who had been killed.""",
+        "send_to": {RoleType.MODERATOR.value},
+        "restricted_to": empty_set,
+    },
+    15: {
+        "content": "{player_current_dead} was killed last night!",
+        "send_to": {RoleType.MODERATOR.value},
+        "restricted_to": empty_set,
+    },
+    16: {
+        "content": """Living players: {living_players}, now freely talk about the current situation based on your observation and
+reflection with a few sentences. Decide whether to reveal your identity based on your reflection.""",
+        "send_to": {MESSAGE_ROUTE_TO_ALL},  # send to all to speak in daytime
+        "restricted_to": empty_set,
+    },
+    17: {
+        "content": """Now vote and tell me who you think is the werewolf. Don’t mention your role.
+You only choose one from the following living options please:
+{living_players}. 
Say ONLY: I vote to eliminate ...""",
+        "send_to": {MESSAGE_ROUTE_TO_ALL},
+        "restricted_to": empty_set,
+    },
+    18: {
+        "content": """{player_current_dead} was eliminated.""",
+        "send_to": {RoleType.MODERATOR.value},
+        "restricted_to": empty_set,
+    },
+}
diff --git a/metagpt/environment/werewolf/env_space.py b/metagpt/environment/werewolf/env_space.py
new file mode 100644
index 0000000000..30a0fa01d3
--- /dev/null
+++ b/metagpt/environment/werewolf/env_space.py
@@ -0,0 +1,60 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+# @Desc   : werewolf observation/action space and its action definition
+
+from gymnasium import spaces
+from pydantic import ConfigDict, Field
+
+from metagpt.environment.base_env_space import BaseEnvAction, BaseEnvActionType
+from metagpt.environment.werewolf.const import STEP_INSTRUCTIONS
+
+
+class EnvActionType(BaseEnvActionType):
+    NONE = 0  # no action to run, just get observation
+    WOLF_KILL = 1  # wolf kill someone
+    VOTE_KILL = 2  # vote kill someone
+    WITCH_POISON = 3  # witch poison someone
+    WITCH_SAVE = 4  # witch save someone
+    GUARD_PROTECT = 5  # guard protect someone
+    PROGRESS_STEP = 6  # step increment
+
+
+class EnvAction(BaseEnvAction):
+    model_config = ConfigDict(arbitrary_types_allowed=True)
+
+    action_type: int = Field(default=EnvActionType.NONE, description="action type")
+    player_name: str = Field(default="", description="the name of the player performing the action")
+    target_player_name: str = Field(default="", description="the name of the player the action is taken on")
+
+
+def get_observation_space() -> spaces.Dict:
+    space = spaces.Dict(
+        {
+            "game_setup": spaces.Text(256),
+            "step_idx": spaces.Discrete(len(STEP_INSTRUCTIONS)),
+            "living_players": spaces.Tuple(
+                (spaces.Text(16), spaces.Text(16))
+            ),  # TODO should be tuple of variable length
+            "werewolf_players": spaces.Tuple(
+                (spaces.Text(16), spaces.Text(16))
+            ),  # TODO should be tuple of variable length
+            "player_hunted": spaces.Text(16),
+            "player_current_dead": spaces.Tuple((spaces.Text(16),)),  # TODO should be tuple of variable length
+            "witch_poison_left": spaces.Discrete(2),
+            "witch_antidote_left": spaces.Discrete(2),
+            "winner": spaces.Text(16),
+            "win_reason": spaces.Text(64),
+        }
+    )
+    return space
+
+
+def get_action_space() -> spaces.Dict:
+    space = spaces.Dict(
+        {
+            "action_type": spaces.Discrete(len(EnvActionType)),
+            "player_name": spaces.Text(16),  # the player performing the action
+            "target_player_name": spaces.Text(16),  # the player the action is taken on
+        }
+    )
+    return space
diff --git a/metagpt/environment/werewolf/werewolf_env.py b/metagpt/environment/werewolf/werewolf_env.py
new file mode 100644
index 0000000000..999ff63a1c
--- /dev/null
+++ b/metagpt/environment/werewolf/werewolf_env.py
@@ -0,0 +1,41 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+# @Desc   : MG Werewolf Env
+
+from typing import Iterable
+
+from pydantic import Field
+
+from metagpt.environment.base_env import Environment
+from metagpt.environment.werewolf.werewolf_ext_env import WerewolfExtEnv
+from metagpt.schema import Message
+
+
+class WerewolfEnv(WerewolfExtEnv, Environment):
+    round_cnt: int = Field(default=0)
+
+    def add_roles(self, roles: Iterable["Role"]):
+        """Add a batch of characters in the current environment"""
+        for role in roles:
+            self.roles[role.name] = role  # use name as key here, since multiple players can share the same profile
+
+        for role in roles:  # setup system message with roles
+            role.context = self.context
+            role.set_env(self)
+
+    def publish_message(self, 
message: Message, add_timestamp: bool = True): + """Post information to the current environment""" + if add_timestamp: + # Because the content of the message may be repeated, for example, killing the same person in two nights + # Therefore, a unique round_cnt prefix needs to be added so that the same message will not be automatically deduplicated when added to the memory. + message.content = f"{self.round_cnt} | " + message.content + super().publish_message(message) + + async def run(self, k=1): + """Process all Role runs by order""" + for _ in range(k): + for role in self.roles.values(): + await role.run() + self.round_cnt += 1 diff --git a/metagpt/environment/werewolf_env/werewolf_ext_env.py b/metagpt/environment/werewolf/werewolf_ext_env.py similarity index 54% rename from metagpt/environment/werewolf_env/werewolf_ext_env.py rename to metagpt/environment/werewolf/werewolf_ext_env.py index 7c4b4c475a..a8636536b1 100644 --- a/metagpt/environment/werewolf_env/werewolf_ext_env.py +++ b/metagpt/environment/werewolf/werewolf_ext_env.py @@ -4,109 +4,27 @@ import random from collections import Counter -from enum import Enum -from typing import Callable, Optional +from typing import Any, Callable, Optional from pydantic import ConfigDict, Field from metagpt.environment.base_env import ExtEnv, mark_as_readable, mark_as_writeable +from metagpt.environment.base_env_space import BaseEnvObsParams +from metagpt.environment.werewolf.const import STEP_INSTRUCTIONS, RoleState, RoleType +from metagpt.environment.werewolf.env_space import EnvAction, EnvActionType from metagpt.logs import logger -class RoleState(Enum): - ALIVE = "alive" # the role is alive - KILLED = "killed" # the role is killed by werewolf or voting - POISONED = "poisoned" # the role is killed by posion - SAVED = "saved" # the role is saved by antidote - - -# the ordered rules by the moderator to announce to everyone each step -STEP_INSTRUCTIONS = { - 0: { - "content": "It’s dark, everyone close your eyes. I will talk with you/your team secretly at night.", - "send_to": "Moderator", # for moderator to continuen speaking - "restricted_to": "", - }, - 1: { - "content": "Guard, please open your eyes!", - "send_to": "Moderator", # for moderator to continuen speaking - "restricted_to": "", - }, - 2: { - "content": """Guard, now tell me who you protect tonight? - You only choose one from the following living options please: {living_players}. - Or you can pass. For example: Protect ...""", - "send_to": "Guard", - "restricted_to": "Moderator,Guard", - }, - 3: {"content": "Guard, close your eyes", "send_to": "Moderator", "restricted_to": ""}, - 4: {"content": "Werewolves, please open your eyes!", "send_to": "Moderator", "restricted_to": ""}, - 5: { - "content": """Werewolves, I secretly tell you that {werewolf_players} are - all of the 2 werewolves! Keep in mind you are teammates. The rest players are not werewolves. - choose one from the following living options please: - {living_players}. For example: Kill ...""", - "send_to": "Werewolf", - "restricted_to": "Moderator,Werewolf", - }, - 6: {"content": "Werewolves, close your eyes", "send_to": "Moderator", "restricted_to": ""}, - 7: {"content": "Witch, please open your eyes!", "send_to": "Moderator", "restricted_to": ""}, - 8: { - "content": """Witch, tonight {player_hunted} has been killed by the werewolves. - You have a bottle of antidote, would you like to save him/her? 
If so, say "Save", else, say "Pass".""", - "send_to": "Witch", - "restricted_to": "Moderator,Witch", - }, # 要先判断女巫是否有解药,再去询问女巫是否使用解药救人 - 9: { - "content": """Witch, you also have a bottle of poison, would you like to use it to kill one of the living players? - Choose one from the following living options: {living_players}. - If so, say ONLY "Poison PlayerX", replace PlayerX with the actual player name, else, say "Pass".""", - "send_to": "Witch", - "restricted_to": "Moderator,Witch", - }, # - 10: {"content": "Witch, close your eyes", "send_to": "Moderator", "restricted_to": ""}, - 11: {"content": "Seer, please open your eyes!", "send_to": "Moderator", "restricted_to": ""}, - 12: { - "content": """Seer, you can check one player's identity. Who are you going to verify its identity tonight? - Choose only one from the following living options:{living_players}.""", - "send_to": "Seer", - "restricted_to": "Moderator,Seer", - }, - 13: {"content": "Seer, close your eyes", "send_to": "Moderator", "restricted_to": ""}, - # The 1-st daytime - 14: { - "content": """It's daytime. Everyone woke up except those who had been killed.""", - "send_to": "Moderator", - "restricted_to": "", - }, - 15: {"content": "{player_current_dead} was killed last night!", "send_to": "Moderator", "restricted_to": ""}, - 16: { - "content": """Living players: {living_players}, now freely talk about the current situation based on your observation and - reflection with a few sentences. Decide whether to reveal your identity based on your reflection.""", - "send_to": "", # send to all to speak in daytime - "restricted_to": "", - }, - 17: { - "content": """Now vote and tell me who you think is the werewolf. Don’t mention your role. - You only choose one from the following living options please: - {living_players}. 
Say ONLY: I vote to eliminate ...""", - "send_to": "", - "restricted_to": "", - }, - 18: {"content": """{player_current_dead} was eliminated.""", "send_to": "Moderator", "restricted_to": ""}, -} - - class WerewolfExtEnv(ExtEnv): model_config = ConfigDict(arbitrary_types_allowed=True) players_state: dict[str, tuple[str, RoleState]] = Field( - default=dict(), description="the player's role type and state by player_name" + default_factory=dict, description="the player's role type and state by player_name" ) round_idx: int = Field(default=0) # the current round step_idx: int = Field(default=0) # the current step of current round - eval_step_idx: int = Field(default=0) + eval_step_idx: list[int] = Field(default=[]) per_round_steps: int = Field(default=len(STEP_INSTRUCTIONS)) # game global states @@ -114,13 +32,13 @@ class WerewolfExtEnv(ExtEnv): special_role_players: list[str] = Field(default=[]) winner: Optional[str] = Field(default=None) win_reason: Optional[str] = Field(default=None) - witch_poison_left: int = Field(default=1) - witch_antidote_left: int = Field(default=1) + witch_poison_left: int = Field(default=1, description="should be 1 or 0") + witch_antidote_left: int = Field(default=1, description="should be 1 or 0") # game current round states, a round is from closing your eyes to the next time you close your eyes - round_hunts: dict[str, str] = Field(default=dict(), description="nighttime wolf hunt result") + round_hunts: dict[str, str] = Field(default_factory=dict, description="nighttime wolf hunt result") round_votes: dict[str, str] = Field( - default=dict(), description="daytime all players vote result, key=voteer, value=voted one" + default_factory=dict, description="daytime all players vote result, key=voter, value=voted one" ) player_hunted: Optional[str] = Field(default=None) player_protected: Optional[str] = Field(default=None) @@ -128,6 +46,76 @@ class WerewolfExtEnv(ExtEnv): player_poisoned: Optional[str] = Field(default=None) player_current_dead: list[str] = Field(default=[]) + def reset( + self, + *, + seed: Optional[int] = None, + options: Optional[dict[str, Any]] = None, + ) -> tuple[dict[str, Any], dict[str, Any]]: + """currently unused""" + pass + + def observe(self, obs_params: Optional[BaseEnvObsParams] = None) -> Any: + """currently unused""" + pass + + def _get_obs(self): + return { + "game_setup": self.game_setup, + "step_idx": self.step_idx, + "living_players": self.living_players, + "werewolf_players": self.werewolf_players, # currently, lack observation isolation + "player_hunted": self.player_hunted, + "player_current_dead": self.player_current_dead, + "witch_poison_left": self.witch_poison_left, + "witch_antidote_left": self.witch_antidote_left, + "winner": self.winner, + "win_reason": self.win_reason, + } + + def step(self, action: EnvAction) -> tuple[dict[str, Any], float, bool, bool, dict[str, Any]]: + action_type = action.action_type + player_name = action.player_name + target_player_name = action.target_player_name + if action_type == EnvActionType.WOLF_KILL: + self.wolf_kill_someone(wolf_name=player_name, player_name=target_player_name) + elif action_type == EnvActionType.VOTE_KILL: + self.vote_kill_someone(voter_name=player_name, player_name=target_player_name) + elif action_type == EnvActionType.WITCH_POISON: + self.witch_poison_someone(witch_name=player_name, player_name=target_player_name) + elif action_type == EnvActionType.WITCH_SAVE: + self.witch_save_someone(witch_name=player_name, player_name=target_player_name) + elif action_type == 
EnvActionType.GUARD_PROTECT:
+            self.guard_protect_someone(guard_name=player_name, player_name=target_player_name)
+        elif action_type == EnvActionType.PROGRESS_STEP:
+            self.progress_step()
+        elif action_type == EnvActionType.NONE:
+            pass
+        else:
+            raise ValueError(f"not supported action_type: {action_type}")
+
+        self.update_game_states()
+        terminated = self._check_game_finish()
+        obs = self._get_obs()
+        return obs, 1.0, terminated, False, {}
+
+    def _check_game_finish(self) -> bool:
+        """return True if game finished else False"""
+        # game's termination condition
+        terminated = False
+        living_werewolf = [p for p in self.werewolf_players if p in self.living_players]
+        living_villagers = [p for p in self.villager_players if p in self.living_players]
+        living_special_roles = [p for p in self.special_role_players if p in self.living_players]
+        if not living_werewolf:
+            self.winner = "good guys"
+            self.win_reason = "werewolves all dead"
+            terminated = True
+        elif not living_villagers or not living_special_roles:
+            self.winner = "werewolf"
+            self.win_reason = "villagers all dead" if not living_villagers else "special roles all dead"
+            terminated = True
+        return terminated
+
     @property
     def living_players(self) -> list[str]:
         player_names = []
@@ -146,12 +134,12 @@ def _role_type_players(self, role_type: str) -> list[str]:
 
     @property
     def werewolf_players(self) -> list[str]:
-        player_names = self._role_type_players(role_type="Werewolf")
+        player_names = self._role_type_players(role_type=RoleType.WEREWOLF.value)
         return player_names
 
     @property
     def villager_players(self) -> list[str]:
-        player_names = self._role_type_players(role_type="Villager")
+        player_names = self._role_type_players(role_type=RoleType.VILLAGER.value)
         return player_names
 
     def _init_players_state(self, players: list["Role"]):
@@ -178,14 +166,14 @@ def init_game_setup(
         """init players using different roles' num"""
         role_objs = []
         for role_obj in role_uniq_objs:
-            if str(role_obj) == "Villager":
+            if RoleType.VILLAGER.value in str(role_obj):
                 role_objs.extend([role_obj] * num_villager)
-            elif str(role_obj) == "Werewolf":
+            elif RoleType.WEREWOLF.value in str(role_obj):
                 role_objs.extend([role_obj] * num_werewolf)
             else:
                 role_objs.append(role_obj)
         if shuffle:
-            random.shuffle(len(role_objs))
+            random.shuffle(role_objs)
         if add_human:
             assigned_role_idx = random.randint(0, len(role_objs) - 1)
             assigned_role = role_objs[assigned_role_idx]
@@ -218,10 +206,12 @@ def _update_players_state(self, player_names: list[str], state: RoleState = Role
             roletype_state = self.players_state[player_name]
             self.players_state[player_name] = (roletype_state[0], state)
 
-    def _check_valid_role(self, player: "Role", role_type: str) -> bool:
-        return True if role_type in str(player) else False
+    def _check_valid_role(self, player_name: str, role_type: str) -> bool:
+        roletype_state = self.players_state.get(player_name)
+        return True if roletype_state and role_type in roletype_state[0] else False
 
     def _check_player_continue(self, player_name: str, particular_step: int = -1) -> bool:
+        """check whether the operation can currently be applied to this player"""
         step_idx = self.step_idx % self.per_round_steps
         if particular_step > 0 and step_idx != particular_step:  # step no
             # particular_step = 18, not daytime vote time, ignore
@@ -238,6 +228,10 @@ def curr_step_instruction(self) -> dict:
         self.step_idx += 1
         return instruction
 
+    @mark_as_writeable
+    def progress_step(self):
+        self.step_idx += 1
+
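With this dispatch in place, a game driver no longer calls the write APIs directly; it feeds `EnvAction`s into `step()`. A small sketch, assuming `env` is an already constructed `WerewolfExtEnv` and the player names are hypothetical:

```python
from metagpt.environment.werewolf.env_space import EnvAction, EnvActionType

# Night phase: a werewolf picks a victim.
kill = EnvAction(action_type=EnvActionType.WOLF_KILL, player_name="Player1", target_player_name="Player5")
obs, reward, terminated, truncated, info = env.step(kill)

# Advance the moderator script without any player action.
env.step(EnvAction(action_type=EnvActionType.PROGRESS_STEP))
```

     @mark_as_readable
     def get_players_state(self, player_names: list[str]) -> dict[str, RoleState]:
         players_state 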
@@ -248,57 +242,72 @@ def get_players_state(self, player_names: list[str]) -> dict[str, RoleState]:
         return players_state
 
     @mark_as_writeable
-    def vote_kill_someone(self, voteer: "Role", player_name: str = None):
+    def vote_kill_someone(self, voter_name: str, player_name: str = None):
         """player vote result at daytime
         player_name: if it's None, regard as abstaining from voting
         """
-        if not self._check_player_continue(voteer.name, particular_step=18):  # 18=step no
+        if not self._check_player_continue(voter_name, particular_step=18):  # 18=step no
             return
 
-        self.round_votes[voteer.name] = player_name
+        self.round_votes[voter_name] = player_name
         # check if all living players finish voting, then get the dead one
         if list(self.round_votes.keys()) == self.living_players:
             voted_all = list(self.round_votes.values())  # TODO in case of tie vote, check who was voted first
             voted_all = [item for item in voted_all if item]
-            self.player_current_dead = Counter(voted_all).most_common()[0][0]
-            self._update_players_state([self.player_current_dead])
+            self.player_current_dead = [Counter(voted_all).most_common()[0][0]]
+            self._update_players_state(self.player_current_dead)
 
     @mark_as_writeable
-    def wolf_kill_someone(self, wolf: "Role", player_name: str):
-        if not self._check_valid_role(wolf, "Werewolf"):
+    def wolf_kill_someone(self, wolf_name: str, player_name: str):
+        if not self._check_valid_role(wolf_name, RoleType.WEREWOLF.value):
             return
-        if not self._check_player_continue(wolf.name, particular_step=5):  # 5=step no
+        if not self._check_player_continue(wolf_name, particular_step=6):  # 6=step no
             return
 
-        self.round_hunts[wolf.name] = player_name
-        living_werewolf = [p for p in self.werewolf_players if p in self.living_players]
+        self.round_hunts[wolf_name] = player_name
+        # living_werewolf = [p for p in self.werewolf_players if p in self.living_players]
         # check if all living wolfs finish hunting, then get the hunted one
-        if list(self.round_hunts.keys()) == living_werewolf:
-            hunted_all = list(self.round_hunts.values())
-            self.player_hunted = Counter(hunted_all).most_common()[0][0]
-
-    @mark_as_writeable
-    def witch_poison_someone(self, witch: "Role", player_name: str = None):
-        if not self._check_valid_role(witch, "Witch"):
+        # if list(self.round_hunts.keys()) == living_werewolf:
+        #     hunted_all = list(self.round_hunts.values())
+        #     self.player_hunted = Counter(hunted_all).most_common()[0][0]
+        self.player_hunted = player_name
+
+    def _witch_poison_or_save_someone(
+        self, witch_name: str, player_name: str = None, state: RoleState = RoleState.POISONED
+    ):
+        if not self._check_valid_role(witch_name, RoleType.WITCH.value):
             return
         if not self._check_player_continue(player_name):
             return
 
-        self._update_players_state([player_name], RoleState.POISONED)
-        self.player_poisoned = player_name
+        assert state in [RoleState.POISONED, RoleState.SAVED]
+        self._update_players_state([player_name], state)
+        if state == RoleState.POISONED:
+            self.player_poisoned = player_name
+            self.witch_poison_left -= 1
+        else:
+            # self.player_protected = player_name
+            self.is_hunted_player_saved = True
+            self.witch_antidote_left -= 1
 
     @mark_as_writeable
-    def witch_save_someone(self, witch: "Role", player_name: str = None):
-        if not self._check_valid_role(witch, "Witch"):
+    def witch_poison_someone(self, witch_name: str, player_name: str = None):
+        self._witch_poison_or_save_someone(witch_name, player_name, RoleState.POISONED)
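A quick illustration of the one-use potion bookkeeping that the shared helper above centralizes. Player names are made up, and the step gating in `_check_player_continue` is assumed to pass at the corresponding steps.

```python
env.wolf_kill_someone(wolf_name="Player2", player_name="Player5")    # night hunt
env.witch_save_someone(witch_name="Player7", player_name="Player5")  # antidote spent
# is_hunted_player_saved is now True and witch_antidote_left has dropped by 1,
# so the night resolution in update_game_states() will spare Player5.
```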
+
+    @mark_as_writeable
+    def witch_save_someone(self, witch_name: str, player_name: str = None):
+        self._witch_poison_or_save_someone(witch_name, player_name, RoleState.SAVED)
+
+    @mark_as_writeable
+    def guard_protect_someone(self, guard_name: str, player_name: str = None):
+        if not self._check_valid_role(guard_name, RoleType.GUARD.value):
             return
         if not self._check_player_continue(player_name):
             return
-
-        self._update_players_state([player_name], RoleState.SAVED)
         self.player_protected = player_name
 
     @mark_as_writeable
-    def update_game_states(self, memories: list):
+    def update_game_states(self):
         step_idx = self.step_idx % self.per_round_steps
         if step_idx not in [15, 18] or self.step_idx in self.eval_step_idx:
             return
@@ -314,22 +323,12 @@ def update_game_states(self, memories: list):
             if self.player_poisoned:
                 self.player_current_dead.append(self.player_poisoned)
 
-            self._update_players_state([self.player_current_dead])
+            self._update_players_state(self.player_current_dead)
 
             # reset
             self.player_hunted = None
             self.player_protected = None
             self.is_hunted_player_saved = False
             self.player_poisoned = None
-
-            # game's termination condition
-            living_werewolf = [p for p in self.werewolf_players if p in self.living_players]
-            living_villagers = [p for p in self.villager_players if p in self.living_players]
-            living_special_roles = [p for p in self.special_role_players if p in self.living_players]
-            if not living_werewolf:
-                self.winner = "good guys"
-                self.win_reason = "werewolves all dead"
-            elif not living_villagers or not living_special_roles:
-                self.winner = "werewolf"
-                self.win_reason = "villagers all dead" if not living_villagers else "special roles all dead"
-            if self.winner is not None:
-                self._record_all_experiences()  # TODO
+        elif step_idx == 18:
+            # the day-vote death was already applied in vote_kill_someone
+            pass
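The night-resolution rule applied at step 15 above (the hunted player dies unless guarded or saved, as implied by the state flags, while a poisoned player dies regardless) can be restated as a small pure function for clarity. This sketch is illustrative only and is not code from the diff.

```python
from typing import Optional


def resolve_night(hunted: Optional[str], protected: Optional[str], saved: bool, poisoned: Optional[str]) -> list[str]:
    """Illustrative restatement: who dies tonight given the env's state flags."""
    dead = []
    if hunted and hunted != protected and not saved:
        dead.append(hunted)  # wolves' target, neither guarded nor saved
    if poisoned:
        dead.append(poisoned)  # the witch's poison always kills
    return dead


assert resolve_night("P5", None, False, None) == ["P5"]  # hunt succeeds
assert resolve_night("P5", "P5", False, None) == []      # guard protected the target
assert resolve_night("P5", None, True, "P2") == ["P2"]   # witch saved P5 but poisoned P2
```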
diff --git a/metagpt/environment/werewolf_env/werewolf_env.py b/metagpt/environment/werewolf_env/werewolf_env.py
deleted file mode 100644
index d174f322ca..0000000000
--- a/metagpt/environment/werewolf_env/werewolf_env.py
+++ /dev/null
@@ -1,31 +0,0 @@
-#!/usr/bin/env python
-# -*- coding: utf-8 -*-
-# @Desc   : MG Werewolf Env
-
-from pydantic import Field
-
-from metagpt.environment.base_env import Environment
-from metagpt.environment.werewolf_env.werewolf_ext_env import WerewolfExtEnv
-from metagpt.logs import logger
-from metagpt.schema import Message
-
-
-class WerewolfEnv(Environment, WerewolfExtEnv):
-    timestamp: int = Field(default=0)
-
-    def publish_message(self, message: Message, add_timestamp: bool = True):
-        """Post information to the current environment"""
-        logger.debug(f"publish_message: {message.dump()}")
-        if add_timestamp:
-            # Because the content of the message may be repeated, for example, killing the same person in two nights
-            # Therefore, a unique timestamp prefix needs to be added so that the same message will not be automatically deduplicated when added to the memory.
-            message.content = f"{self.timestamp} | " + message.content
-        self.memory.add(message)
-        self.history += f"\n{message}"
-
-    async def run(self, k=1):
-        """Process all Role runs by order"""
-        for _ in range(k):
-            for role in self.roles.values():
-                await role.run()
-            self.timestamp += 1
diff --git a/metagpt/ext/__init__.py b/metagpt/ext/__init__.py
new file mode 100644
index 0000000000..2bcf8efd09
--- /dev/null
+++ b/metagpt/ext/__init__.py
@@ -0,0 +1,3 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+# @Desc   :
diff --git a/metagpt/ext/android_assistant/README.md b/metagpt/ext/android_assistant/README.md
new file mode 100644
index 0000000000..fe8b4b3e32
--- /dev/null
+++ b/metagpt/ext/android_assistant/README.md
@@ -0,0 +1,118 @@
+# MetaGPT Android Assistant
+
+The MetaGPT Android Assistant is an intelligent assistant driven by a multi-modal large language model and built on the MetaGPT framework. It can learn users' daily usage patterns on its own and, following plain-text instructions, automatically carry out operations across a wide range of apps, leaving the user's hands entirely free.
+Below we introduce the features of the MetaGPT Android Assistant and how to use it.
+
+## Features
+
+The MetaGPT Android Assistant operates in two stages: learning and automatic execution. We introduce its features by walking through these two stages.
+
+### Learning Stage
+
+By learning from human demonstrations, or by exploring an app according to human instructions, the MetaGPT Android Assistant learns the app's functionality and generates operation documents that the later "automatic execution" stage consumes. Roughly 20 rounds of exploration for a given task objective can significantly improve performance.
+
+Set `stage` to `learn` to put the Android Assistant into the learning stage. Set `mode` to `auto` to have it learn through automatic exploration, or to `manual` to have it learn from a human demonstration. The Usage section explains the script parameters in detail. You can experiment with the automatic exploration and manual demonstration modes on the "Messenger" app with the following commands:
+
+```bash
+cd examples/android_assistant
+python run_assistant.py "Send 'When will we release this feature?' to +86 8888888" --stage "learn" --mode "auto or manual" --app-name "Messenger"
+```
+
+#### Learning Based on Human Demonstration
+While the Android Assistant explores on its own during the learning stage, your hands stay free. When you instruct it to learn from your demonstration instead, you need to respond to the prompts in the terminal so that it can record your operations accurately.
+A possible example is as follows:
+
+```bash
+cd examples/android_assistant
+python run_assistant.py "Send 'When will we release this feature?' to +86 8888888" --stage "learn" --mode "manual" --app-name "Messenger"
+```
+
+After running this command, you will first see a screenshot of the Android screen with each interactive element labeled, as shown in the figure below:
+
+
+
+Note the numeric tag of the element you want to operate on; the terminal will then print requests like the ones below. Answer them to teach the Android Assistant your demonstrated actions:
+
+```bash
+| INFO     | examples.android_assistant.actions.manual_record:run:96 - Which element do you want to tap? Choose a numeric tag from 1 to 11:
+user_input: 8
+| INFO     | examples.android_assistant.actions.manual_record:run:81 - Choose one of the following actions you want to perform on the current screen:
+tap, text, long_press, swipe, stop
+user_input: tap
+```
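Behind the scenes, `ManualRecord` (added later in this PR) appends one line per demonstrated action to a `record.txt` and closes the file with `stop`. A recorded demo might look like the following; the line format follows the `log_str` templates in `ManualRecord`, while the element uids here are made up:

```text
tap(8):::android.widget.Button_send
text(3:sep:'When will we release this feature?'):::android.widget.EditText_input
swipe(5:sep:up):::androidx.recyclerview.widget.RecyclerView_chat
stop
```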
+### Automatic Execution Stage
+Once the Android Assistant has completed the learning stage, you can instruct it to carry out tasks on the phone with a plain-text description. Supplied with the operation documents produced during learning, it has richer prior knowledge and executes tasks more reliably.
+You can instruct the Android Assistant to send messages in the "Messenger" app with the following command:
+```bash
+python run_assistant.py "Send 'When will we release this feature?' to +86 8888888" --stage "act" --mode "auto or manual" --app-name "Messenger"
+```
+With `mode` set to `auto`, the Android Assistant uses the operation records compiled through self-exploration; with `mode` set to `manual`, it uses the operation documents accumulated from learning via human demonstration.
+
+## Installation
+To use the Android Assistant, you first need to satisfy the following prerequisites:
+1. Complete the installation of the MetaGPT environment.
+2. Install [Android Debug Bridge (ADB)](https://developer.android.com/tools/adb?hl=zh-cn) on your PC; ADB enables interaction between your PC and Android devices.
+3. Install Android Studio and, within it, the Android emulator, which gives the Android Assistant an environment to learn and act in. For how to install the Android emulator, refer to [Quick Installation of Android Studio & Emulator](https://docs.expo.dev/workflow/android-studio-emulator/).
+4. (Optional) Connect your Android device to a USB port of your PC; this can likewise serve as the environment in which the Android Assistant learns and acts.
+
+Note ⚠️: When working with the Android emulator, we use the Medium Phone device profile; first-time users are advised to start with this profile as well.
+
+After completing these steps, you can enter the following command to check that ADB is installed and the Android device is connected:
+```bash
+adb devices
+```
+
+## Usage
+The MetaGPT Android Assistant is designed within the MetaGPT framework as a `Role` together with multiple `Action`s. You run it by executing the `run_assistant.py` script. The script's parameters are described below:
+```text
+Usage: run_assistant.py [OPTIONS] TASK_DESC
+
+  Run an Android Assistant
+
+Arguments:
+  TASK_DESC  the task description you want the android assistant to learn or
+             act on  [required]
+
+Options:
+  --n-round INTEGER               The max round to do an app operation task.
+                                  [default: 20]
+  --stage TEXT                    stage: learn / act  [default: learn]
+  --mode TEXT                     mode: auto / manual, when stage=learn
+                                  [default: auto]
+  --app-name TEXT                 the name of the app you want to run
+                                  [default: demo]
+  --investment FLOAT              Dollar amount to invest in the AI company.
+                                  [default: 5.0]
+  --refine-doc / --no-refine-doc  Refine existing operation docs based on the
+                                  latest observation if True.
+                                  [default: no-refine-doc]
+  --min-dist INTEGER              The minimum distance between elements to
+                                  prevent overlapping during the labeling
+                                  process.  [default: 30]
+  --android-screenshot-dir TEXT   The path to store screenshots on the android
+                                  device. Make sure it exists.  [default:
+                                  /sdcard/Pictures/Screenshots]
+  --android-xml-dir TEXT          The path to store XML files used to
+                                  determine the location of UI elements. Make
+                                  sure it exists.  [default: /sdcard]
+  --device-id TEXT                The Android device_id  [default:
+                                  emulator-5554]
+  --help                          Show this message and exit.
+```
+
+## Acknowledgements
+The MetaGPT Android Assistant draws on some ideas and code from the [AppAgent](https://github.com/mnotgod96/AppAgent) project. We thank the developers of the AppAgent project.
+
+### Citation
+
+```bib
+@misc{yang2023appagent,
+      title={AppAgent: Multimodal Agents as Smartphone Users},
+      author={Chi Zhang and Zhao Yang and Jiaxuan Liu and Yucheng Han and Xin Chen and Zebiao Huang and Bin Fu and Gang Yu},
+      year={2023},
+      eprint={2312.13771},
+      archivePrefix={arXiv},
+      primaryClass={cs.CV}
+}
+```
\ No newline at end of file
diff --git a/metagpt/ext/android_assistant/README_CN.md b/metagpt/ext/android_assistant/README_CN.md
new file mode 100644
index 0000000000..a1abbe3b0b
--- /dev/null
+++ b/metagpt/ext/android_assistant/README_CN.md
@@ -0,0 +1,113 @@
+# MetaGPT 安卓助理
+
+MetaGPT安卓助理是一款依托于先进的MetaGPT框架构建的多模态大语言模型驱动的智能辅助工具。
+它具备自我学习的能力，能够通过学习掌握用户的日常使用方式，同时能够根据用户的指令自动完成各类应用程序的操作任务，实现了用户双手的全面解放。
+接下来，我们将介绍MetaGPT安卓助理的功能以及如何使用它。
+
+## 功能
+
+MetaGPT 安卓助理的执行主要包含两个阶段，分别为自我学习与自动执行。下面，我们将从这两个阶段介绍MetaGPT 安卓助理的具体功能。
+
+### 自我学习阶段
+
+通过学习人类演示或基于人类指令对app进行探索，MetaGPT安卓助理可以对app的功能进行学习，生成相应的操作文档，为后续的"自动执行"阶段使用。对于任何给定的任务目标，进行约20轮的探索可以显著提高性能。
+
+通过设定`stage`为`learn`可要求安卓助理进入自我学习阶段。通过设定`mode`为`auto`，可要求安卓助理通过自动探索学习，通过设定`mode`为`manual`，可要求安卓助理通过人类手动演示学习。在使用章节，我们对脚本的参数进行了详细的说明。
+您可以尝试对"Messenger"应用程序进行自动探索和手动演示模式的实验，具体命令如下：
+
+```bash
+cd examples/android_assistant
+python run_assistant.py "Send 'When will we release this feature?' to +86 8888888" --stage "learn" --mode "auto or manual" --app-name "Messenger"
+```
+
+#### 基于人类演示的学习
+在要求安卓助理在自我学习阶段执行自我探索时，您可以解放您的双手；但在要求它根据您的指令进行学习时，你需要根据终端中的指令进行输入，以便安卓助理能够准确地学习您的操作方式。
+一个可能的例子如下：
+
+```bash
+cd examples/android_assistant
+python run_assistant.py "Send 'When will we release this feature?' to +86 8888888" --stage "learn" --mode "manual" --app-name "Messenger"
+```
+
+在运行这一指令后，你将首先看到一个在各个可交互的位置进行了标记的安卓屏幕的截图，如下图：
+
+
+
+在记住你要操作的位置之后，终端中将会输出与下面类似的要求，回复它，进而指挥安卓助理学习你的演示行为：
+
+```bash
+| INFO     | examples.android_assistant.actions.manual_record:run:96 - Which element do you want to tap? Choose a numeric tag from 1 to 11:
+user_input: 8
+| INFO     | examples.android_assistant.actions.manual_record:run:81 - Choose one of the following actions you want to perform on the current screen:
+tap, text, long_press, swipe, stop
+user_input: tap
+```
+### 自动执行阶段
+在安卓助理完成了自我学习阶段之后，您可以通过文本描述的方式，指挥安卓助理在手机中完成任务。通过为其配置自我学习阶段的操作文档，安卓助理具备了更丰富的前置知识，执行能力进一步得到提升。
+你可以通过以下指令，指挥安卓助理在"Messenger"应用中发送信息：
+```bash
+python run_assistant.py "Send 'When will we release this feature?' to +86 8888888" --stage "act" --mode "auto or manual" --app-name "Messenger"
+```
+其中，`mode`选择`auto`，安卓助理将使用自我探索中积累的操作文档；`mode`选择`manual`，安卓助理将使用人类演示学习中积累的操作文档。
+
+## 安装
+为了使用安卓助理，你首先需要满足以下条件：
+1. 完成MetaGPT环境的安装
+2. 在你的PC上安装[Android Debug Bridge(ADB)](https://developer.android.com/tools/adb?hl=zh-cn)，ADB可以使你的PC与安卓设备进行交互。
+3. 安装Android Studio，在其中安装Android模拟器，以为安卓助手提供学习与执行的环境。关于如何安装Android模拟器，可以参考[快速安装Android Studio & Emulator](https://dev.weixin.qq.com/docs/framework/dev/framework/env/android-simulator.html)。
+4. （可选）将你的安卓设备连接到PC的USB端口上，这同样可以为安卓助手提供学习与执行的环境。
+
+注意 ⚠️：在使用Android模拟器进行操作时，我们使用的模拟器型号为Medium Phone，建议第一次尝试此类应用的用户使用这一型号完成操作。
+
+在完成这一系列操作之后，你可以输入以下命令检查ADB是否安装成功，以及安卓设备是否连接：
+```bash
+adb devices
+```
+## 使用
+MetaGPT 安卓助理在MetaGPT框架中被设计为一个`Role`与多个`Action`的集合，你可以通过运行`run_assistant.py`脚本来运行它。这一脚本具体的参数说明如下：
+```text
+用法：run_assistant.py [选项] 任务描述
+
+    运行一个安卓助手
+
+参数:
+  TASK_DESC                       你希望安卓助手学习或执行的任务描述
+                                  [必需]
+
+选项:
+  --n-round 整数                  执行应用程序操作任务的最大轮数。
+                                  [默认值：20]
+  --stage 文本                    阶段：learn/act  [默认值：learn]
+  --mode 文本                     模式：auto/manual，当 stage=learn 时  [默认值：auto]
+  --app-name 文本                 你想要运行的应用程序名称  [默认值：demo]
+  --investment 浮点数             投资于人工智能公司的美元金额。
+                                  [默认值：5.0]
+  --refine-doc / --no-refine-doc  如果为真，则根据最新的观察结果优化现有操作文档。
+                                  [默认值：--no-refine-doc]
+  --min-dist 整数                 在标记过程中防止元素重叠的最小元素间距。
+                                  [默认值：30]
+  --android-screenshot-dir 文本   在安卓设备上存储截图的路径。确保其存在。
+                                  [默认值：/sdcard/Pictures/Screenshots]
+  --android-xml-dir 文本          存储用于确定UI元素位置的XML文件的路径。
+                                  确保其存在。[默认值：/sdcard]
+  --device-id 文本                安卓device_id  [默认值：emulator-5554]
+  --help                          显示此信息并退出。
+```
+
+## 致谢
+MetaGPT 安卓助理参考了 [AppAgent](https://github.com/mnotgod96/AppAgent) 项目的部分思路与代码，感谢 AppAgent 项目的开发者们。
+
+### 引用
+
+```bib
+@misc{yang2023appagent,
+      title={AppAgent: Multimodal Agents as Smartphone Users},
+      author={Chi Zhang and Zhao Yang and Jiaxuan Liu and Yucheng Han and Xin Chen and Zebiao Huang and Bin Fu and Gang Yu},
+      year={2023},
+      eprint={2312.13771},
+      archivePrefix={arXiv},
+      primaryClass={cs.CV}
+}
+```
\ No newline at end of file
diff --git a/metagpt/ext/android_assistant/__init__.py b/metagpt/ext/android_assistant/__init__.py
new file mode 100644
index 0000000000..2bcf8efd09
--- /dev/null
+++ b/metagpt/ext/android_assistant/__init__.py
@@ -0,0 +1,3 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+# @Desc   :
diff --git a/metagpt/ext/android_assistant/actions/__init__.py b/metagpt/ext/android_assistant/actions/__init__.py
new file mode 100644
index 0000000000..2bcf8efd09
--- /dev/null
+++ b/metagpt/ext/android_assistant/actions/__init__.py
@@ -0,0 +1,3 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+# @Desc   :
diff --git a/metagpt/ext/android_assistant/actions/manual_record.py b/metagpt/ext/android_assistant/actions/manual_record.py
new file mode 100644
index 0000000000..bcfb2ed893
--- /dev/null
+++ b/metagpt/ext/android_assistant/actions/manual_record.py
@@ -0,0 +1,168 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+# @Desc   : manual record user interaction in stage=learn & mode=manual, LIKE scripts/step_recorder.py
+import time
+from pathlib import Path
+
+import cv2
+
+from metagpt.actions.action import Action
+from metagpt.config2 import config
+from metagpt.environment.android.android_env import AndroidEnv
+from metagpt.environment.android.const import ADB_EXEC_FAIL
+from metagpt.environment.android.env_space import (
+    EnvAction,
+    EnvActionType,
+    EnvObsParams,
+    EnvObsType,
+)
+from metagpt.ext.android_assistant.utils.schema import (
+    ActionOp,
+    AndroidActionOutput,
+    RunState,
+    SwipeOp,
+)
+from metagpt.ext.android_assistant.utils.utils import (
+    draw_bbox_multi,
+    elem_list_from_xml_tree,
+)
+from metagpt.logs import logger
+
+
+class ManualRecord(Action):
+    """record a human demonstration on the screen from terminal input"""
+
+    name: str = "ManualRecord"
+
+    useless_list: list[str] = []  # store the uids of useless elements
+    record_path: Path = ""
+    task_desc_path: Path = ""
+    screenshot_before_path: Path =
"" + screenshot_after_path: Path = "" + xml_path: Path = "" + + async def run(self, task_desc: str, task_dir: Path, env: AndroidEnv): + self.record_path = Path(task_dir) / "record.txt" + self.task_desc_path = Path(task_dir) / "task_desc.txt" + self.screenshot_before_path = Path(task_dir) / "raw_screenshots" + self.screenshot_after_path = Path(task_dir) / "labeled_screenshots" + self.xml_path = Path(task_dir) / "xml" + for path in [self.screenshot_before_path, self.screenshot_after_path, self.xml_path]: + path.mkdir(parents=True, exist_ok=True) + + self.record_path.write_text("") + record_file = open(self.record_path, "w") + self.task_desc_path.write_text(task_desc) + + step = 0 + extra_config = config.extra + while True: + step += 1 + screenshot_path: Path = env.observe( + EnvObsParams( + obs_type=EnvObsType.GET_SCREENSHOT, ss_name=f"{step}", local_save_dir=self.screenshot_before_path + ) + ) + xml_path: Path = env.observe( + EnvObsParams(obs_type=EnvObsType.GET_XML, xml_name=f"{step}", local_save_dir=self.xml_path) + ) + if not screenshot_path.exists() or not xml_path.exists(): + return AndroidActionOutput(action_state=RunState.FAIL) + + elem_list = elem_list_from_xml_tree(xml_path, self.useless_list, extra_config.get("min_dist", 30)) + + screenshot_labeled_path = Path(self.screenshot_after_path).joinpath(f"{step}_labeled.png") + labeled_img = draw_bbox_multi(screenshot_path, screenshot_labeled_path, elem_list) + + cv2.namedWindow("image", cv2.WINDOW_NORMAL) + cv2.imshow("image", labeled_img) + cv2.waitKey(0) + cv2.destroyAllWindows() + + user_input = "xxx" + logger.info( + "Choose one of the following actions you want to perform on the current screen:\n" + "tap, text, long_press, swipe, stop" + ) + + while ( + user_input.lower() != ActionOp.TAP.value + and user_input.lower() != ActionOp.TEXT.value + and user_input.lower() != ActionOp.LONG_PRESS.value + and user_input.lower() != ActionOp.SWIPE.value + and user_input.lower() != ActionOp.STOP.value + ): + user_input = input("user_input: ") + + if user_input.lower() == ActionOp.TAP.value: + logger.info(f"Which element do you want to tap? Choose a numeric tag from 1 to {len(elem_list)}:") + user_input = "xxx" + while not user_input.isnumeric() or int(user_input) > len(elem_list) or int(user_input) < 1: + user_input = input("user_input: ") + tl, br = elem_list[int(user_input) - 1].bbox + x, y = (tl[0] + br[0]) // 2, (tl[1] + br[1]) // 2 + action = EnvAction(action_type=EnvActionType.SYSTEM_TAP, coord=(x, y)) + log_str = f"tap({int(user_input)}):::{elem_list[int(user_input) - 1].uid}\n" + elif user_input.lower() == ActionOp.TEXT.value: + logger.info( + f"Which element do you want to input the text string? Choose a numeric tag from 1 to " + f"{len(elem_list)}:" + ) + input_area = "xxx" + while not input_area.isnumeric() or int(input_area) > len(elem_list) or int(input_area) < 1: + input_area = input("user_input: ") + logger.info("Enter your input text below:") + user_input = "" + while not user_input: + user_input = input("user_input: ") + action = EnvAction(action_type=EnvActionType.USER_INPUT, input_txt=user_input) + log_str = f"text({input_area}:sep:'{user_input}'):::{elem_list[int(input_area) - 1].uid}\n" + elif user_input.lower() == ActionOp.LONG_PRESS.value: + logger.info( + f"Which element do you want to long press? 
Choose a numeric tag from 1 to {len(elem_list)}:" + ) + user_input = "xxx" + while not user_input.isnumeric() or int(user_input) > len(elem_list) or int(user_input) < 1: + user_input = input("user_input: ") + tl, br = elem_list[int(user_input) - 1].bbox + x, y = (tl[0] + br[0]) // 2, (tl[1] + br[1]) // 2 + action = EnvAction(action_type=EnvActionType.USER_LONGPRESS, coord=(x, y)) + log_str = f"long_press({int(user_input)}):::{elem_list[int(user_input) - 1].uid}\n" + elif user_input.lower() == ActionOp.SWIPE.value: + logger.info( + "What is the direction of your swipe? Choose one from the following options:\n" + "up, down, left, right" + ) + user_input = "" + while ( + user_input != SwipeOp.UP.value + and user_input != SwipeOp.DOWN.value + and user_input != SwipeOp.LEFT.value + and user_input != SwipeOp.RIGHT.value + ): + user_input = input("user_input: ") + swipe_dir = user_input + logger.info(f"Which element do you want to swipe? Choose a numeric tag from 1 to {len(elem_list)}:") + while not user_input.isnumeric() or int(user_input) > len(elem_list) or int(user_input) < 1: + user_input = input("user_input: ") + tl, br = elem_list[int(user_input) - 1].bbox + x, y = (tl[0] + br[0]) // 2, (tl[1] + br[1]) // 2 + + action = EnvAction(action_type=EnvActionType.USER_SWIPE, coord=(x, y), orient=swipe_dir) + log_str = f"swipe({int(user_input)}:sep:{swipe_dir}):::{elem_list[int(user_input) - 1].uid}\n" + elif user_input.lower() == ActionOp.STOP.value: + record_file.write("stop\n") + record_file.close() + break + else: + break + + obs, _, _, _, info = env.step(action) + action_res = info["res"] + if action_res == ADB_EXEC_FAIL: + return AndroidActionOutput(action_state=RunState.FAIL) + record_file.write(log_str) + + time.sleep(1) + + return AndroidActionOutput(action_state=RunState.SUCCESS) diff --git a/metagpt/ext/android_assistant/actions/parse_record.py b/metagpt/ext/android_assistant/actions/parse_record.py new file mode 100644 index 0000000000..304daf6556 --- /dev/null +++ b/metagpt/ext/android_assistant/actions/parse_record.py @@ -0,0 +1,137 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : parse record to generate learned standard operations in stage=learn & mode=manual, +# LIKE scripts/document_generation.py + +import ast +import re +from pathlib import Path + +from metagpt.actions.action import Action +from metagpt.config2 import config +from metagpt.ext.android_assistant.actions.parse_record_an import RECORD_PARSE_NODE +from metagpt.ext.android_assistant.prompts.operation_prompt import ( + long_press_doc_template, + refine_doc_suffix, + swipe_doc_template, + tap_doc_template, + text_doc_template, +) +from metagpt.ext.android_assistant.utils.schema import ( + ActionOp, + AndroidActionOutput, + RecordLogItem, + RunState, + SwipeOp, +) +from metagpt.logs import logger +from metagpt.utils.common import encode_image + + +class ParseRecord(Action): + name: str = "ParseRecord" + record_path: Path = "" + task_desc_path: Path = "" + screenshot_before_path: Path = "" + screenshot_after_path: Path = "" + + async def run(self, task_dir: Path, docs_dir: Path): + doc_count = 0 + self.record_path = Path(task_dir) / "record.txt" + self.task_desc_path = Path(task_dir) / "task_desc.txt" + self.screenshot_before_path = Path(task_dir) / "raw_screenshots" + self.screenshot_after_path = Path(task_dir) / "labeled_screenshots" + for path in [self.screenshot_before_path, self.screenshot_after_path]: + path.mkdir(parents=True, exist_ok=True) + + task_desc = self.task_desc_path.read_text() + extra_config 
= config.extra
+
+        with open(self.record_path, "r") as record_file:
+            record_step_count = len(record_file.readlines()) - 1
+            record_file.seek(0)
+            for step in range(1, record_step_count + 1):
+                img_before_base64 = encode_image(self.screenshot_after_path.joinpath(f"{step}_labeled.png"))
+                img_after_base64 = encode_image(self.screenshot_after_path.joinpath(f"{step + 1}_labeled.png"))
+                rec = record_file.readline().strip()
+                action, resource_id = rec.split(":::")
+                action_type = action.split("(")[0]
+                # build the prompt for this recorded action
+                action_param = re.findall(r"\((.*?)\)", action)[0]
+                if action_type == ActionOp.TAP.value:
+                    prompt_template = tap_doc_template
+                    context = prompt_template.format(ui_element=action_param)
+                elif action_type == ActionOp.TEXT.value:
+                    input_area, input_text = action_param.split(":sep:")
+                    prompt_template = text_doc_template
+                    context = prompt_template.format(ui_element=input_area)
+                elif action_type == ActionOp.LONG_PRESS.value:
+                    prompt_template = long_press_doc_template
+                    context = prompt_template.format(ui_element=action_param)
+                elif action_type == ActionOp.SWIPE.value:
+                    swipe_area, swipe_dir = action_param.split(":sep:")
+                    if swipe_dir == SwipeOp.UP.value or swipe_dir == SwipeOp.DOWN.value:
+                        action_type = ActionOp.VERTICAL_SWIPE.value
+                    elif swipe_dir == SwipeOp.LEFT.value or swipe_dir == SwipeOp.RIGHT.value:
+                        action_type = ActionOp.HORIZONTAL_SWIPE.value
+                    prompt_template = swipe_doc_template
+                    context = prompt_template.format(swipe_dir=swipe_dir, ui_element=swipe_area)
+                else:
+                    break
+                context = context.format(task_desc=task_desc)
+
+                doc_name = resource_id + ".txt"
+                doc_path = docs_dir.joinpath(doc_name)
+
+                if doc_path.exists():
+                    try:
+                        doc_content = ast.literal_eval(doc_path.read_text())
+                    except Exception as exp:
+                        logger.error(f"ast parse doc: {doc_path} failed, exp: {exp}")
+                        continue
+
+                    if doc_content[action_type]:
+                        if extra_config.get("doc_refine", False):
+                            refine_context = refine_doc_suffix.format(old_doc=doc_content[action_type])
+                            context += refine_context
+                            logger.info(
+                                f"Documentation for the element {resource_id} already exists. The doc will be "
+                                f"refined based on the latest demo."
+                            )
+                        else:
+                            logger.info(
+                                f"Documentation for the element {resource_id} already exists. Turn on DOC_REFINE "
+                                f"in the config file if needed."
+                            )
+                            continue
+                else:
+                    doc_content = {"tap": "", "text": "", "v_swipe": "", "h_swipe": "", "long_press": ""}
+
+                logger.info(f"Waiting for GPT-4V to generate documentation for the element {resource_id}")
+                node = await RECORD_PARSE_NODE.fill(
+                    context=context, llm=self.llm, images=[img_before_base64, img_after_base64]
+                )
+                if "error" in node.content:
+                    return AndroidActionOutput(action_state=RunState.FAIL)
+                log_path = task_dir.joinpath("log_parse_record.txt")
+                prompt = node.compile(context=context, schema="json", mode="auto")
+                msg = node.content
+                doc_content[action_type] = msg
+
+                with open(log_path, "a") as logfile:
+                    log_item = RecordLogItem(
+                        step=step,
+                        prompt=prompt,
+                        image_before=img_before_base64,
+                        image_after=img_after_base64,
+                        response=node.content,
+                    )
+                    logfile.write(log_item.model_dump_json() + "\n")
+                with open(doc_path, "w") as outfile:
+                    outfile.write(str(doc_content))
+                doc_count += 1
+                logger.info(f"Documentation generated and saved to {doc_path}")
+
+        logger.info(f"Documentation generation phase completed.
{doc_count} docs generated.") + + return AndroidActionOutput(action_state=RunState.FINISH) diff --git a/metagpt/ext/android_assistant/actions/parse_record_an.py b/metagpt/ext/android_assistant/actions/parse_record_an.py new file mode 100644 index 0000000000..210c93e236 --- /dev/null +++ b/metagpt/ext/android_assistant/actions/parse_record_an.py @@ -0,0 +1,32 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : the ActionNode to parse record + +from metagpt.actions.action_node import ActionNode + +OBSERVATION = ActionNode( + key="Observation", + expected_type=str, + instruction="Provide a description of your observations of the two images. " + "Subsequently, delineate the distinctions between the first image and the second one.", + example="", +) + +THOUGHT = ActionNode( + key="Thought", + expected_type=str, + instruction="Consider the impact of Action acting on UI elements.", + example="", +) + +DESCRIPTION = ActionNode( + key="Description", + expected_type=str, + instruction="Describe the functionality of the UI element concisely in one or two sentences Do not include " + "the numeric tag in your description", + example="", +) + +NODES = [OBSERVATION, THOUGHT, DESCRIPTION] + +RECORD_PARSE_NODE = ActionNode.from_children("RecordParse", NODES) diff --git a/metagpt/ext/android_assistant/actions/screenshot_parse.py b/metagpt/ext/android_assistant/actions/screenshot_parse.py new file mode 100644 index 0000000000..4d8bb0e1eb --- /dev/null +++ b/metagpt/ext/android_assistant/actions/screenshot_parse.py @@ -0,0 +1,204 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : LIKE scripts/task_executor.py in stage=act + +import ast +from pathlib import Path + +from metagpt.actions.action import Action +from metagpt.config2 import config +from metagpt.environment.android.android_env import AndroidEnv +from metagpt.environment.android.const import ADB_EXEC_FAIL +from metagpt.environment.android.env_space import ( + EnvAction, + EnvActionType, + EnvObsParams, + EnvObsType, +) +from metagpt.ext.android_assistant.actions.screenshot_parse_an import ( + SCREENSHOT_PARSE_NODE, +) +from metagpt.ext.android_assistant.prompts.assistant_prompt import ( + screenshot_parse_template, + screenshot_parse_with_grid_template, +) +from metagpt.ext.android_assistant.utils.schema import ( + AndroidActionOutput, + AndroidElement, + GridOpParam, + LongPressGridOpParam, + LongPressOpParam, + OpLogItem, + RunState, + SwipeGridOpParam, + SwipeOpParam, + TapGridOpParam, + TapOpParam, + TextOpParam, +) +from metagpt.ext.android_assistant.utils.utils import ( + area_to_xy, + draw_bbox_multi, + draw_grid, + elem_bbox_to_xy, + screenshot_parse_extract, + traverse_xml_tree, +) +from metagpt.logs import logger +from metagpt.utils.common import encode_image + + +class ScreenshotParse(Action): + name: str = "ScreenshotParse" + + def _makeup_ui_document(self, elem_list: list[AndroidElement], docs_idr: Path, use_exist_doc: bool = True) -> str: + if not use_exist_doc: + return "" + + ui_doc = """ +You also have access to the following documentations that describes the functionalities of UI +elements you can interact on the screen. These docs are crucial for you to determine the target of your +next action. 
You should always prioritize these documented elements for interaction: """ + for i, elem in enumerate(elem_list): + doc_path = docs_idr.joinpath(f"{elem.uid}.txt") + if not doc_path.exists(): + continue + try: + doc_content = ast.literal_eval(doc_path.read_text()) + except Exception as exp: + logger.error(f"ast parse doc: {doc_path} failed, exp: {exp}") + continue + + ui_doc += f"Documentation of UI element labeled with the numeric tag '{i + 1}':\n" + if doc_content["tap"]: + ui_doc += f"This UI element is clickable. {doc_content['tap']}\n\n" + if doc_content["text"]: + ui_doc += ( + f"This UI element can receive text input. The text input is used for the following " + f"purposes: {doc_content['text']}\n\n" + ) + if doc_content["long_press"]: + ui_doc += f"This UI element is long clickable. {doc_content['long_press']}\n\n" + if doc_content["v_swipe"]: + ui_doc += ( + f"This element can be swiped directly without tapping. You can swipe vertically on " + f"this UI element. {doc_content['v_swipe']}\n\n" + ) + if doc_content["h_swipe"]: + ui_doc += ( + f"This element can be swiped directly without tapping. You can swipe horizontally on " + f"this UI element. {doc_content['h_swipe']}\n\n" + ) + return ui_doc + + async def run( + self, + round_count: int, + task_desc: str, + last_act: str, + task_dir: Path, + docs_dir: Path, + grid_on: bool, + env: AndroidEnv, + ): + extra_config = config.extra + for path in [task_dir, docs_dir]: + path.mkdir(parents=True, exist_ok=True) + screenshot_path: Path = env.observe( + EnvObsParams(obs_type=EnvObsType.GET_SCREENSHOT, ss_name=f"{round_count}_before", local_save_dir=task_dir) + ) + xml_path: Path = env.observe( + EnvObsParams(obs_type=EnvObsType.GET_XML, xml_name=f"{round_count}", local_save_dir=task_dir) + ) + if not screenshot_path.exists() or not xml_path.exists(): + return AndroidActionOutput(action_state=RunState.FAIL) + + clickable_list = [] + focusable_list = [] + traverse_xml_tree(xml_path, clickable_list, "clickable", True) + traverse_xml_tree(xml_path, focusable_list, "focusable", True) + elem_list: list[AndroidElement] = clickable_list.copy() + for elem in focusable_list: + bbox = elem.bbox + center = (bbox[0][0] + bbox[1][0]) // 2, (bbox[0][1] + bbox[1][1]) // 2 + close = False + for e in clickable_list: + bbox = e.bbox + center_ = (bbox[0][0] + bbox[1][0]) // 2, (bbox[0][1] + bbox[1][1]) // 2 + dist = (abs(center[0] - center_[0]) ** 2 + abs(center[1] - center_[1]) ** 2) ** 0.5 + if dist <= extra_config.get("min_dist", 30): + close = True + break + if not close: + elem_list.append(elem) + + screenshot_labeled_path = task_dir.joinpath(f"{round_count}_labeled.png") + draw_bbox_multi(screenshot_path, screenshot_labeled_path, elem_list) + img_base64 = encode_image(screenshot_labeled_path) + + parse_template = screenshot_parse_with_grid_template if grid_on else screenshot_parse_template + + if grid_on: + env.rows, env.cols = draw_grid(screenshot_path, task_dir / f"{round_count}_grid.png") + + ui_doc = self._makeup_ui_document(elem_list, docs_dir) + context = parse_template.format(ui_document=ui_doc, task_description=task_desc, last_act=last_act) + node = await SCREENSHOT_PARSE_NODE.fill(context=context, llm=self.llm, images=[img_base64]) + + if "error" in node.content: + return AndroidActionOutput(action_state=RunState.FAIL) + + prompt = node.compile(context=context, schema="json", mode="auto") + OpLogItem(step=round_count, prompt=prompt, image=str(screenshot_labeled_path), response=node.content) + + op_param = 
screenshot_parse_extract(node.instruct_content.model_dump(), grid_on) + if op_param.param_state == RunState.FINISH: + logger.info(f"op_param: {op_param}") + return AndroidActionOutput(action_state=RunState.FINISH) + if op_param.param_state == RunState.FAIL: + return AndroidActionOutput(action_state=RunState.FAIL) + + last_act = op_param.last_act + if isinstance(op_param, TapOpParam): + x, y = elem_bbox_to_xy(elem_list[op_param.area - 1].bbox) + action = EnvAction(action_type=EnvActionType.SYSTEM_TAP, coord=(x, y)) + elif isinstance(op_param, TextOpParam): + action = EnvAction(action_type=EnvActionType.USER_INPUT, input_txt=op_param.input_str) + elif isinstance(op_param, LongPressOpParam): + x, y = elem_bbox_to_xy(elem_list[op_param.area - 1].bbox) + action = EnvAction(action_type=EnvActionType.USER_LONGPRESS, coord=(x, y)) + elif isinstance(op_param, SwipeOpParam): + x, y = elem_bbox_to_xy(elem_list[op_param.area - 1].bbox) + action = EnvAction( + action_type=EnvActionType.USER_SWIPE, coord=(x, y), orient=op_param.swipe_orient, dist=op_param.dist + ) + elif isinstance(op_param, GridOpParam): + grid_on = True + elif isinstance(op_param, TapGridOpParam) or isinstance(op_param, LongPressGridOpParam): + x, y = area_to_xy(op_param.area, op_param.subarea, env.width, env.height, env.rows, env.cols) + if isinstance(op_param, TapGridOpParam): + action = EnvAction(action_type=EnvActionType.SYSTEM_TAP, coord=(x, y)) + else: + # LongPressGridOpParam + action = EnvAction(action_type=EnvActionType.USER_LONGPRESS, coord=(x, y)) + elif isinstance(op_param, SwipeGridOpParam): + start_x, start_y = area_to_xy( + op_param.start_area, op_param.start_subarea, env.width, env.height, env.rows, env.cols + ) + end_x, end_y = area_to_xy( + op_param.end_area, op_param.end_subarea, env.width, env.height, env.rows, env.cols + ) + action = EnvAction( + action_type=EnvActionType.USER_SWIPE_TO, coord=(start_x, start_y), tgt_coord=(end_x, end_y) + ) + + if not grid_on: + obs, _, _, _, info = env.step(action) + action_res = info["res"] + if action_res == ADB_EXEC_FAIL: + return AndroidActionOutput(action_state=RunState.FAIL) + + if op_param.act_name != "grid": + grid_on = False + + return AndroidActionOutput(data={"grid_on": grid_on, "last_act": last_act}) diff --git a/metagpt/ext/android_assistant/actions/screenshot_parse_an.py b/metagpt/ext/android_assistant/actions/screenshot_parse_an.py new file mode 100644 index 0000000000..eb23ba9344 --- /dev/null +++ b/metagpt/ext/android_assistant/actions/screenshot_parse_an.py @@ -0,0 +1,48 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : the ActionNode to parse screenshot + +from metagpt.actions.action_node import ActionNode + +OBSERVATION = ActionNode( + key="Observation", expected_type=str, instruction="Describe what you observe in the image", example="" +) + +THOUGHT = ActionNode( + key="Thought", + expected_type=str, + instruction="To complete the given task, what is the next step I should do", + example="", +) + +ACTION = ActionNode( + key="Action", + expected_type=str, + instruction="The function call with the correct parameters to proceed with the task. If you believe the task is " + "completed or there is nothing to be done, you should output FINISH. You cannot output anything else " + "except a function call or FINISH in this field.", + example="", +) + +SUMMARY = ActionNode( + key="Summary", + expected_type=str, + instruction="Summarize your past actions along with your latest action in one or two sentences. 
Do not include " + "the numeric tag in your summary", + example="", +) + +SUMMARY_GRID = ActionNode( + key="Summary", + expected_type=str, + instruction="Summarize your past actions along with your latest action in one or two sentences. Do not include " + "the grid area number in your summary", + example="", +) + +NODES = [OBSERVATION, THOUGHT, ACTION, SUMMARY] + +NODES_GRID = [OBSERVATION, THOUGHT, ACTION, SUMMARY_GRID] + +SCREENSHOT_PARSE_NODE = ActionNode.from_children("ScreenshotParse", NODES) +SCREENSHOT_PARSE_GRID_NODE = ActionNode.from_children("ScreenshotParseGrid", NODES_GRID) diff --git a/metagpt/ext/android_assistant/actions/self_learn_and_reflect.py b/metagpt/ext/android_assistant/actions/self_learn_and_reflect.py new file mode 100644 index 0000000000..5e9cfbb454 --- /dev/null +++ b/metagpt/ext/android_assistant/actions/self_learn_and_reflect.py @@ -0,0 +1,231 @@ +# !/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : LIKE scripts/self_explorer.py in stage=learn & mode=auto self_explore_task stage + +import ast +from pathlib import Path + +from metagpt.actions.action import Action +from metagpt.config2 import config +from metagpt.environment.android.android_env import AndroidEnv +from metagpt.environment.android.const import ADB_EXEC_FAIL +from metagpt.environment.android.env_space import ( + EnvAction, + EnvActionType, + EnvObsParams, + EnvObsType, +) +from metagpt.ext.android_assistant.actions.screenshot_parse_an import ( + SCREENSHOT_PARSE_NODE, +) +from metagpt.ext.android_assistant.actions.self_learn_reflect_an import ( + SELF_LEARN_REFLECT_NODE, +) +from metagpt.ext.android_assistant.prompts.assistant_prompt import ( + screenshot_parse_self_explore_reflect_template as reflect_template, +) +from metagpt.ext.android_assistant.prompts.assistant_prompt import ( + screenshot_parse_self_explore_template, +) +from metagpt.ext.android_assistant.utils.schema import ( + ActionOp, + AndroidActionOutput, + AndroidElement, + Decision, + DocContent, + LongPressOpParam, + OpLogItem, + ReflectLogItem, + RunState, + SwipeOp, + SwipeOpParam, + TapOpParam, + TextOpParam, +) +from metagpt.ext.android_assistant.utils.utils import ( + draw_bbox_multi, + elem_bbox_to_xy, + elem_list_from_xml_tree, + reflect_parse_extarct, + screenshot_parse_extract, +) +from metagpt.logs import logger +from metagpt.utils.common import encode_image + + +class SelfLearnAndReflect(Action): + name: str = "SelfLearnAndReflect" + + useless_list: list[str] = [] # store useless elements uid + + screenshot_before_path: str = "" + screenshot_before_base64: str = "" + elem_list: list[AndroidElement] = [] + swipe_orient: str = "up" + act_name: str = "" + ui_area: int = -1 + + async def run( + self, round_count: int, task_desc: str, last_act: str, task_dir: Path, docs_dir: Path, env: AndroidEnv + ) -> AndroidActionOutput: + for path in [task_dir, docs_dir]: + path.mkdir(parents=True, exist_ok=True) + resp = await self.run_self_learn(round_count, task_desc, last_act, task_dir, env) + if resp.action_state != RunState.SUCCESS: + return resp + + resp = await self.run_reflect(round_count, task_desc, last_act, task_dir, docs_dir, env) + return resp + + async def run_self_learn( + self, round_count: int, task_desc: str, last_act: str, task_dir: Path, env: AndroidEnv + ) -> AndroidActionOutput: + extra_config = config.extra + screenshot_path: Path = env.observe( + EnvObsParams(obs_type=EnvObsType.GET_SCREENSHOT, ss_name=f"{round_count}_before", local_save_dir=task_dir) + ) + xml_path: Path = env.observe( + 
EnvObsParams(obs_type=EnvObsType.GET_XML, xml_name=f"{round_count}", local_save_dir=task_dir) + ) + if not screenshot_path.exists() or not xml_path.exists(): + return AndroidActionOutput(action_state=RunState.FAIL) + + elem_list = elem_list_from_xml_tree(xml_path, self.useless_list, extra_config.get("min_dist", 30)) + + screenshot_before_labeled_path = task_dir.joinpath(f"{round_count}_before_labeled.png") + draw_bbox_multi(screenshot_path, screenshot_before_labeled_path, elem_list) + img_base64 = encode_image(screenshot_before_labeled_path) + self.screenshot_before_base64 = img_base64 + self.screenshot_before_path = screenshot_before_labeled_path + + self_explore_template = screenshot_parse_self_explore_template + context = self_explore_template.format(task_description=task_desc, last_act=last_act) + + node = await SCREENSHOT_PARSE_NODE.fill(context=context, llm=self.llm, images=[img_base64]) + logger.debug(f"fill result:{node}") + if "error" in node.content: + return AndroidActionOutput(action_state=RunState.FAIL) + prompt = node.compile(context=context, schema="json", mode="auto") + # Modify WindowsPath to Str + OpLogItem(step=round_count, prompt=prompt, image=str(screenshot_before_labeled_path), response=node.content) + op_param = screenshot_parse_extract(node.instruct_content.model_dump(), grid_on=False) + # TODO Modify Op_param. When op_param.action is FINISH, how to solve this ? + if op_param.param_state == RunState.FINISH: + return AndroidActionOutput(action_state=RunState.FINISH) + if op_param.param_state == RunState.FAIL: + return AndroidActionOutput(action_state=RunState.FAIL) + + if isinstance(op_param, TapOpParam): + self.ui_area = op_param.area + x, y = elem_bbox_to_xy(elem_list[op_param.area - 1].bbox) + action = EnvAction(action_type=EnvActionType.SYSTEM_TAP, coord=(x, y)) + elif isinstance(op_param, TextOpParam): + action = EnvAction(action_type=EnvActionType.USER_INPUT, input_txt=op_param.input_str) + elif isinstance(op_param, LongPressOpParam): + self.ui_area = op_param.area + x, y = elem_bbox_to_xy(elem_list[op_param.area - 1].bbox) + action = EnvAction(action_type=EnvActionType.USER_LONGPRESS, coord=(x, y)) + elif isinstance(op_param, SwipeOpParam): + self.ui_area = op_param.area + self.swipe_orient = op_param.swipe_orient + x, y = elem_bbox_to_xy(elem_list[op_param.area - 1].bbox) + action = EnvAction( + action_type=EnvActionType.USER_SWIPE, coord=(x, y), orient=op_param.swipe_orient, dist=op_param.dist + ) + + obs, _, _, _, info = env.step(action) + action_res = info["res"] + if action_res == ADB_EXEC_FAIL: + return AndroidActionOutput(action_state=RunState.FAIL) + + self.elem_list = elem_list + self.act_name = op_param.act_name + return AndroidActionOutput() + + async def run_reflect( + self, round_count: int, task_desc: str, last_act: str, task_dir: Path, docs_dir: Path, env: AndroidEnv + ) -> AndroidActionOutput: + screenshot_path: Path = env.observe( + EnvObsParams(obs_type=EnvObsType.GET_SCREENSHOT, ss_name=f"{round_count}_after", local_save_dir=task_dir) + ) + if not screenshot_path.exists(): + return AndroidActionOutput(action_state=RunState.FAIL) + + screenshot_after_labeled_path = task_dir.joinpath(f"{round_count}_after_labeled.png") + draw_bbox_multi(screenshot_path, screenshot_after_labeled_path, elem_list=self.elem_list) + img_base64 = encode_image(screenshot_after_labeled_path) + if self.act_name == ActionOp.TAP.value: + action = "tapping" + elif self.act_name == ActionOp.LONG_PRESS.value: + action = "long pressing" + elif self.act_name == 
ActionOp.SWIPE.value:
+            action = "swiping"
+            if self.swipe_orient == SwipeOp.UP.value or self.swipe_orient == SwipeOp.DOWN.value:
+                action = "v_swipe"
+            elif self.swipe_orient == SwipeOp.LEFT.value or self.swipe_orient == SwipeOp.RIGHT.value:
+                action = "h_swipe"
+        else:
+            # TODO: test this branch; this failure is coupled with the IndexError noted below
+            logger.warning(f"Failed to parse the current action name: `{self.act_name}`")
+            action = None
+        context = reflect_template.format(
+            action=action, ui_element=str(self.ui_area), task_desc=task_desc, last_act=last_act
+        )
+        node = await SELF_LEARN_REFLECT_NODE.fill(
+            context=context, llm=self.llm, images=[self.screenshot_before_base64, img_base64]
+        )
+
+        if "error" in node.content:
+            return AndroidActionOutput(action_state=RunState.FAIL)
+
+        prompt = node.compile(context=context, schema="json", mode="auto")
+        ReflectLogItem(
+            step=round_count,
+            prompt=prompt,
+            image_before=str(self.screenshot_before_path),
+            image_after=str(screenshot_after_labeled_path),
+            response=node.content,
+        )
+
+        op_param = reflect_parse_extarct(node.instruct_content.model_dump())
+        if op_param.param_state == RunState.FINISH:
+            return AndroidActionOutput(action_state=RunState.FINISH)
+        if op_param.param_state == RunState.FAIL:
+            return AndroidActionOutput(action_state=RunState.FAIL)
+
+        logger.info(
+            f"reflect_parse_extarct decision: {op_param.decision}, "
+            f"elem_list size: {len(self.elem_list)}, ui_area: {self.ui_area}"
+        )
+        # TODO: this can raise `IndexError: list index out of range`;
+        # if it happens, you may need to click back to the home screen in the emulator
+        resource_id = self.elem_list[int(self.ui_area) - 1].uid
+        if op_param.decision == Decision.INEFFECTIVE.value:
+            self.useless_list.append(resource_id)
+            last_act = "NONE"  # TODO: share last_act globally
+        elif op_param.decision in [Decision.BACK.value, Decision.CONTINUE.value, Decision.SUCCESS.value]:
+            if op_param.decision in [Decision.BACK.value, Decision.CONTINUE.value]:
+                self.useless_list.append(resource_id)
+                last_act = "NONE"
+                if op_param.decision == Decision.BACK.value:
+                    action = EnvAction(action_type=EnvActionType.SYSTEM_BACK)
+                    obs, _, _, _, info = env.step(action)
+                    if info["res"] == ADB_EXEC_FAIL:
+                        return AndroidActionOutput(action_state=RunState.FAIL)
+            doc = op_param.documentation
+            doc_path = docs_dir.joinpath(f"{resource_id}.txt")
+            if doc_path.exists():
+                try:
+                    doc_content = ast.literal_eval(doc_path.read_text())
+                except Exception as exp:
+                    logger.error(f"ast parse doc: {doc_path} failed, exp: {exp}")
+                    return AndroidActionOutput(action_state=RunState.FAIL)
+
+                if doc_content[self.act_name]:
+                    logger.info(f"Documentation for the element {resource_id} already exists.")
+                    return AndroidActionOutput(action_state=RunState.FAIL)
+            else:
+                doc_content = DocContent()
+            setattr(doc_content, self.act_name, doc)
+            doc_path.write_text(str(doc_content))
+        return AndroidActionOutput(data={"last_act": last_act})
diff --git a/metagpt/ext/android_assistant/actions/self_learn_reflect_an.py b/metagpt/ext/android_assistant/actions/self_learn_reflect_an.py
new file mode 100644
index 0000000000..305b7376af
--- /dev/null
+++ b/metagpt/ext/android_assistant/actions/self_learn_reflect_an.py
@@ -0,0 +1,21 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+# @Desc   : the ActionNode to parse Reflection
+
+from metagpt.actions.action_node import ActionNode
+
+DECISION = ActionNode(
+    key="Decision", expected_type=str, instruction="the decision you made: one of BACK, INEFFECTIVE, CONTINUE or SUCCESS", example="BACK"
+)
+
+
+THOUGHT = ActionNode(key="Thought", expected_type=str,
instruction="explain why you made this decision", example="") + + +DOCUMENTATION = ActionNode( + key="Documentation", expected_type=str, instruction="describe the function of the UI element", example="" +) + + +NODES = [DECISION, THOUGHT, DOCUMENTATION] +SELF_LEARN_REFLECT_NODE = ActionNode.from_children("SelfLearnReflect", NODES) diff --git a/metagpt/ext/android_assistant/prompts/__init__.py b/metagpt/ext/android_assistant/prompts/__init__.py new file mode 100644 index 0000000000..2bcf8efd09 --- /dev/null +++ b/metagpt/ext/android_assistant/prompts/__init__.py @@ -0,0 +1,3 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : diff --git a/metagpt/ext/android_assistant/prompts/assistant_prompt.py b/metagpt/ext/android_assistant/prompts/assistant_prompt.py new file mode 100644 index 0000000000..34baf58417 --- /dev/null +++ b/metagpt/ext/android_assistant/prompts/assistant_prompt.py @@ -0,0 +1,168 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : the prompt templates of assistant learning and acting + +screenshot_parse_template = """You are an agent that is trained to perform some basic tasks on a smartphone. You will be given a +smartphone screenshot. The interactive UI elements on the screenshot are labeled with numeric tags starting from 1. The +numeric tag of each interactive element is located in the center of the element. + +You can call the following functions to control the smartphone: + +1. tap(element: int) +This function is used to tap an UI element shown on the smartphone screen. +"element" is a numeric tag assigned to an UI element shown on the smartphone screen. +A simple use case can be tap(5), which taps the UI element labeled with the number 5. + +2. text(text_input: str) +This function is used to insert text input in an input field/box. text_input is the string you want to insert and must +be wrapped with double quotation marks. A simple use case can be text("Hello, world!"), which inserts the string +"Hello, world!" into the input area on the smartphone screen. This function is usually callable when you see a keyboard +showing in the lower half of the screen. + +3. long_press(element: int) +This function is used to long press an UI element shown on the smartphone screen. +"element" is a numeric tag assigned to an UI element shown on the smartphone screen. +A simple use case can be long_press(5), which long presses the UI element labeled with the number 5. + +4. swipe(element: int, direction: str, dist: str) +This function is used to swipe an UI element shown on the smartphone screen, usually a scroll view or a slide bar. +"element" is a numeric tag assigned to an UI element shown on the smartphone screen. "direction" is a string that +represents one of the four directions: up, down, left, right. "direction" must be wrapped with double quotation +marks. "dist" determines the distance of the swipe and can be one of the three options: short, medium, long. You should +choose the appropriate distance option according to your need. +A simple use case can be swipe(21, "up", "medium"), which swipes up the UI element labeled with the number 21 for a +medium distance. + +5. grid() +You should call this function when you find the element you want to interact with is not labeled with a numeric tag and +other elements with numeric tags cannot help with the task. The function will bring up a grid overlay to divide the +smartphone screen into small areas and this will give you more freedom to choose any part of the screen to tap, long +press, or swipe. 
+{ui_document}
+The task you need to complete is to: {task_description}. Your past actions to proceed with this task are summarized as
+follows: {last_act}
+Now, given the documentation and the following labeled screenshot, you need to think and call the function needed to
+proceed with the task. Your output should include three parts in the given format:
+Observation: <describe what you observe in the image>
+Thought: <to complete the given task, what is the next step I should do>
+Action: <the function call with the correct parameters to proceed with the task, or FINISH if the task is completed>
+Summary: <summarize your past actions along with your latest action in one or two sentences; do not include the numeric tag>
+
+You can only take one action at a time, so please directly call the function."""
+
+screenshot_parse_with_grid_template = """You are an agent that is trained to perform some basic tasks on a smartphone. You will be given
+a smartphone screenshot overlaid by a grid. The grid divides the screenshot into small square areas. Each area is
+labeled with an integer in the top-left corner.
+
+You can call the following functions to control the smartphone:
+
+1. tap(area: int, subarea: str)
+This function is used to tap a grid area shown on the smartphone screen. "area" is the integer label assigned to a grid
+area shown on the smartphone screen. "subarea" is a string representing the exact location to tap within the grid area.
+It can take one of the nine values: center, top-left, top, top-right, left, right, bottom-left, bottom, and
+bottom-right.
+A simple use case can be tap(5, "center"), which taps the exact center of the grid area labeled with the number 5.
+
+2. long_press(area: int, subarea: str)
+This function is used to long press a grid area shown on the smartphone screen. "area" is the integer label assigned to
+a grid area shown on the smartphone screen. "subarea" is a string representing the exact location to long press within
+the grid area. It can take one of the nine values: center, top-left, top, top-right, left, right, bottom-left, bottom,
+and bottom-right.
+A simple use case can be long_press(7, "top-left"), which long presses the top left part of the grid area labeled with
+the number 7.
+
+3. swipe(start_area: int, start_subarea: str, end_area: int, end_subarea: str)
+This function is used to perform a swipe action on the smartphone screen, especially when you want to interact with a
+scroll view or a slide bar. "start_area" is the integer label assigned to the grid area which marks the starting
+location of the swipe. "start_subarea" is a string representing the exact location to begin the swipe within the grid
+area. "end_area" is the integer label assigned to the grid area which marks the ending location of the swipe.
+"end_subarea" is a string representing the exact location to end the swipe within the grid area.
+The two subarea parameters can take one of the nine values: center, top-left, top, top-right, left, right, bottom-left,
+bottom, and bottom-right.
+A simple use case can be swipe(21, "center", 25, "right"), which performs a swipe starting from the center of grid area
+21 to the right part of grid area 25.
+
+The task you need to complete is to: {task_description}. Your past actions to proceed with this task are summarized as
+follows: {last_act}
+Now, given the following labeled screenshot, you need to think and call the function needed to proceed with the task.
+Your output should include three parts in the given format:
+Observation: <describe what you observe in the image>
+Thought: <to complete the given task, what is the next step I should do>
+Action: <the function call with the correct parameters to proceed with the task, or FINISH if the task is completed>
+Summary: <summarize your past actions along with your latest action in one or two sentences; do not include the grid area number>
+
+You can only take one action at a time, so please directly call the function."""
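For concreteness, this is roughly how `ScreenshotParse.run()` earlier in this PR consumes these templates and routes the result through the ActionNode (condensed from that async method; the argument values here are made up):

```python
# Condensed from ScreenshotParse.run() above; runs inside an async method.
context = screenshot_parse_template.format(
    ui_document=ui_doc,                     # output of _makeup_ui_document()
    task_description="Send 'hi' to Alice",  # example task
    last_act="None",
)
node = await SCREENSHOT_PARSE_NODE.fill(context=context, llm=self.llm, images=[img_base64])
op_param = screenshot_parse_extract(node.instruct_content.model_dump(), grid_on=False)
```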
+ +You can call the following functions to interact with those labeled elements to control the smartphone: + +1. tap(element: int) +This function is used to tap an UI element shown on the smartphone screen. +"element" is a numeric tag assigned to an UI element shown on the smartphone screen. +A simple use case can be tap(5), which taps the UI element labeled with the number 5. + +2. text(text_input: str) +This function is used to insert text input in an input field/box. text_input is the string you want to insert and must +be wrapped with double quotation marks. A simple use case can be text("Hello, world!"), which inserts the string +"Hello, world!" into the input area on the smartphone screen. This function is only callable when you see a keyboard +showing in the lower half of the screen. + +3. long_press(element: int) +This function is used to long press an UI element shown on the smartphone screen. +"element" is a numeric tag assigned to an UI element shown on the smartphone screen. +A simple use case can be long_press(5), which long presses the UI element labeled with the number 5. + +4. swipe(element: int, direction: str, dist: str) +This function is used to swipe an UI element shown on the smartphone screen, usually a scroll view or a slide bar. +"element" is a numeric tag assigned to an UI element shown on the smartphone screen. "direction" is a string that +represents one of the four directions: up, down, left, right. "direction" must be wrapped with double quotation +marks. "dist" determines the distance of the swipe and can be one of the three options: short, medium, long. You should +choose the appropriate distance option according to your need. +A simple use case can be swipe(21, "up", "medium"), which swipes up the UI element labeled with the number 21 for a +medium distance. + +The task you need to complete is to {task_description}. Your past actions to proceed with this task are summarized as +follows: {last_act} +Now, given the following labeled screenshot, you need to think and call the function needed to proceed with the task. +Your output should include three parts in the given format: + +You can only take one action at a time, so please directly call the function.""" + +screenshot_parse_self_explore_reflect_template = """I will give you screenshots of a mobile app before and after {action} the UI +element labeled with the number '{ui_element}' on the first screenshot. The numeric tag of each element is located at +the center of the element. The action of {action} this UI element was described as follows: +{last_act} +The action was also an attempt to proceed with a larger task, which is to {task_desc}. Your job is to carefully analyze +the difference between the two screenshots to determine if the action is in accord with the description above and at +the same time effectively moved the task forward. Your output should be determined based on the following situations: +1. BACK +If you think the action navigated you to a page where you cannot proceed with the given task, you should go back to the +previous interface. At the same time, describe the functionality of the UI element concisely in one or two sentences by +observing the difference between the two screenshots. Notice that your description of the UI element should focus on +the general function. Never include the numeric tag of the UI element in your description. You can use pronouns such as +"the UI element" to refer to the element. 
Your output should be in the following format: +Decision: BACK +Thought: +Documentation: +2. INEFFECTIVE +If you find the action changed nothing on the screen (screenshots before and after the action are identical), you +should continue to interact with other elements on the screen. Notice that if you find the location of the cursor +changed between the two screenshots, then they are not identical. Your output should be in the following format: +Decision: INEFFECTIVE +Thought: +Documentation: +3. CONTINUE +If you find the action changed something on the screen but did not reflect the action description above and did not +move the given task forward, you should continue to interact with other elements on the screen. At the same time, +describe the functionality of the UI element concisely in one or two sentences by observing the difference between the +two screenshots. Notice that your description of the UI element should focus on the general function. Never include the +numeric tag of the UI element in your description. You can use pronouns such as "the UI element" to refer to the +element. Your output should be in the following format: +Decision: CONTINUE +Thought: +Documentation: +4. SUCCESS +If you think the action successfully moved the task forward (even though it did not complete the task), you should +describe the functionality of the UI element concisely in one or two sentences. Notice that your description of the UI +element should focus on the general function. Never include the numeric tag of the UI element in your description. You +can use pronouns such as "the UI element" to refer to the element. Your output should be in the following format: +Decision: SUCCESS +Thought: +Documentation: +""" diff --git a/metagpt/ext/android_assistant/prompts/operation_prompt.py b/metagpt/ext/android_assistant/prompts/operation_prompt.py new file mode 100644 index 0000000000..1bde53f041 --- /dev/null +++ b/metagpt/ext/android_assistant/prompts/operation_prompt.py @@ -0,0 +1,45 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : the prompt templates of phone operation + +tap_doc_template = """I will give you the screenshot of a mobile app before and after tapping the UI element labeled +with the number {ui_element} on the screen. The numeric tag of each element is located at the center of the element. +Tapping this UI element is a necessary part of proceeding with a larger task, which is to <task_desc>. Your task is to +describe the functionality of the UI element concisely in one or two sentences. Notice that your description of the UI +element should focus on the general function. For example, if the UI element is used to navigate to the chat window +with John, your description should not include the name of the specific person. Just say: "Tapping this area will +navigate the user to the chat window". Never include the numeric tag of the UI element in your description. You can use +pronouns such as "the UI element" to refer to the element.""" + +text_doc_template = """I will give you the screenshot of a mobile app before and after typing in the input area labeled +with the number {ui_element} on the screen. The numeric tag of each element is located at the center of the element. +Typing in this UI element is a necessary part of proceeding with a larger task, which is to <task_desc>. Your task is +to describe the functionality of the UI element concisely in one or two sentences. Notice that your description of the +UI element should focus on the general function. 
For example, if the change of the screenshot shows that the user typed +"How are you?" in the chat box, you do not need to mention the actual text. Just say: "This input area is used for the +user to type a message to send to the chat window". Never include the numeric tag of the UI element in your +description. You can use pronouns such as "the UI element" to refer to the element.""" + +long_press_doc_template = """I will give you the screenshot of a mobile app before and after long pressing the UI +element labeled with the number {ui_element} on the screen. The numeric tag of each element is located at the center of +the element. Long pressing this UI element is a necessary part of proceeding with a larger task, which is to +<task_desc>. Your task is to describe the functionality of the UI element concisely in one or two sentences. Notice +that your description of the UI element should focus on the general function. For example, if long pressing the UI +element redirects the user to the chat window with John, your description should not include the name of the specific +person. Just say: "Long pressing this area will redirect the user to the chat window". Never include the numeric tag of +the UI element in your description. You can use pronouns such as "the UI element" to refer to the element.""" + +swipe_doc_template = """I will give you the screenshot of a mobile app before and after swiping the UI +element labeled with the number {ui_element} on the screen. The numeric tag of each element is located at the center of +the element. Swiping this UI element is a necessary part of proceeding with a larger task, which is to <task_desc>. +Your task is to describe the functionality of the UI element concisely in one or two sentences. Notice that your +description of the UI element should be as general as possible. For example, if swiping the UI element increases the +contrast ratio of an image of a building, your description should be just like this: "Swiping this area enables the +user to tune a specific parameter of the image". Never include the numeric tag of the UI element in your description. +You can use pronouns such as "the UI element" to refer to the element.""" + +refine_doc_suffix = """\nA documentation of this UI element generated from previous demos is shown below. Your +generated description should build on this previous doc and improve it. Notice that it is possible that your +understanding of the function of the UI element derived from the given screenshots conflicts with the previous doc, +because the function of a UI element can be flexible. In this case, your generated description should combine both. 
+Old documentation of this UI element: {old_doc}""" diff --git a/metagpt/ext/android_assistant/roles/__init__.py b/metagpt/ext/android_assistant/roles/__init__.py new file mode 100644 index 0000000000..2bcf8efd09 --- /dev/null +++ b/metagpt/ext/android_assistant/roles/__init__.py @@ -0,0 +1,3 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : diff --git a/metagpt/ext/android_assistant/roles/android_assistant.py b/metagpt/ext/android_assistant/roles/android_assistant.py new file mode 100644 index 0000000000..45636f5191 --- /dev/null +++ b/metagpt/ext/android_assistant/roles/android_assistant.py @@ -0,0 +1,146 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : android assistant to learn from app operations and operate apps +import time +from datetime import datetime +from pathlib import Path +from typing import Optional + +from pydantic import Field + +from metagpt.actions.add_requirement import UserRequirement +from metagpt.config2 import config +from metagpt.const import EXAMPLE_PATH +from metagpt.ext.android_assistant.actions.manual_record import ManualRecord +from metagpt.ext.android_assistant.actions.parse_record import ParseRecord +from metagpt.ext.android_assistant.actions.screenshot_parse import ScreenshotParse +from metagpt.ext.android_assistant.actions.self_learn_and_reflect import ( + SelfLearnAndReflect, +) +from metagpt.ext.android_assistant.utils.schema import AndroidActionOutput, RunState +from metagpt.logs import logger +from metagpt.roles.role import Role, RoleReactMode +from metagpt.schema import Message + + +class AndroidAssistant(Role): + name: str = "Nick" + profile: str = "AndroidAssistant" + goal: str = "operate the mobile phone's apps with self-learn" + + task_desc: str = "" + round_count: int = 0 + last_act: str = "None" + output_root_dir: Optional[Path] = Field(default=None) + task_dir: Optional[Path] = Field(default=None) + docs_dir: Optional[Path] = Field(default=None) + grid_on: bool = Field(default=False) + + def __init__(self, **data): + super().__init__(**data) + + self._watch([UserRequirement, AndroidActionOutput]) + extra_config = config.extra + self.task_desc = extra_config.get("task_desc", "Just explore any app in this phone!") + app_name = extra_config.get("app_name", "demo") + if self.output_root_dir: + data_dir = self.output_root_dir.absolute().joinpath("output") + else: + data_dir = EXAMPLE_PATH.joinpath("android_assistant/output") + cur_datetime = datetime.fromtimestamp(int(time.time())).strftime("%Y-%m-%d_%H-%M-%S") + + """For now, the stage is decided by the user config; later this could be automated, e.g. for a new app, + run the learn stage first and then the act stage, or learn during acting. + """ + stage = extra_config.get("stage") + mode = extra_config.get("mode") + if stage == "learn" and mode == "manual": + # choose ManualRecord and then run ParseRecord + # Note: each of these actions runs exactly once, so there is no need to run n_round. 
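+            # Stage/mode dispatch, summarized from the branches below: + #   learn + manual -> ManualRecord then ParseRecord (turn a human demo into element docs) + #   learn + auto   -> SelfLearnAndReflect (explore the app and document it autonomously) + #   act            -> ScreenshotParse, reading manual_docs or auto_docs to match the learn mode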
+ self.set_actions([ManualRecord, ParseRecord]) + self.task_dir = data_dir.joinpath(app_name, f"manual_learn_{cur_datetime}") + self.docs_dir = data_dir.joinpath(app_name, "manual_docs") + elif stage == "learn" and mode == "auto": + # choose SelfLearnAndReflect to run + self.set_actions([SelfLearnAndReflect]) + self.task_dir = data_dir.joinpath(app_name, f"auto_learn_{cur_datetime}") + self.docs_dir = data_dir.joinpath(app_name, "auto_docs") + elif stage == "act": + # choose ScreenshotParse to run + self.set_actions([ScreenshotParse]) + self.task_dir = data_dir.joinpath(app_name, f"act_{cur_datetime}") + if mode == "manual": + self.docs_dir = data_dir.joinpath(app_name, "manual_docs") + else: + self.docs_dir = data_dir.joinpath(app_name, "auto_docs") + else: + raise ValueError(f"invalid stage: {stage}, mode: {mode}") + + self._check_dir() + + self._set_react_mode(RoleReactMode.BY_ORDER) + + def _check_dir(self): + self.task_dir.mkdir(parents=True, exist_ok=True) + self.docs_dir.mkdir(parents=True, exist_ok=True) + + async def react(self) -> Message: + self.round_count += 1 + result = await super().react() + logger.debug(f"react result {result}") + return result + + async def _observe(self, ignore_memory=True) -> int: + """ignore old memory to make it run multi rounds inside a role""" + newest_msgs = self.rc.memory.get(k=1) + newest_msg = newest_msgs[0] if newest_msgs else None + if newest_msg and (RunState.SUCCESS.value.upper() not in newest_msg.content): + ignore_memory = False + state_val = newest_msg.content.split(".")[-1] # RoundCount: 1, action_state: RunState.SUCCESS + logger.warning(f"Latest action_state is {state_val}, will run in the remainder rounds without `react`") + return await super()._observe(ignore_memory) + + async def _act(self) -> Message: + logger.info(f"{self._setting}: to do {self.rc.todo}({self.rc.todo.name})") + todo = self.rc.todo + if isinstance(todo, ManualRecord): + resp = await todo.run(task_dir=self.task_dir, task_desc=self.task_desc, env=self.rc.env) + elif isinstance(todo, ParseRecord): + resp = await todo.run( + task_dir=self.task_dir, + docs_dir=self.docs_dir, + ) + elif isinstance(todo, SelfLearnAndReflect): + resp = await todo.run( + round_count=self.round_count, + task_desc=self.task_desc, + last_act=self.last_act, + task_dir=self.task_dir, + docs_dir=self.docs_dir, + env=self.rc.env, + ) + if resp.action_state == RunState.SUCCESS: + self.last_act = resp.data.get("last_act") + elif isinstance(todo, ScreenshotParse): + resp = await todo.run( + round_count=self.round_count, + task_desc=self.task_desc, + last_act=self.last_act, + task_dir=self.task_dir, + docs_dir=self.docs_dir, + grid_on=self.grid_on, + env=self.rc.env, + ) + if resp.action_state == RunState.SUCCESS: + logger.info(f"grid_on: {resp.data.get('grid_on')}") + self.grid_on = resp.data.get("grid_on", False) + self.last_act = resp.data.get("last_act", "None") + msg = Message( + content=f"RoundCount: {self.round_count}, action_state: {resp.action_state}", + role=self.profile, + cause_by=type(resp), + send_from=self.name, + send_to=self.name, + ) + + self.rc.memory.add(msg) + return msg diff --git a/metagpt/ext/android_assistant/utils/__init__.py b/metagpt/ext/android_assistant/utils/__init__.py new file mode 100644 index 0000000000..2bcf8efd09 --- /dev/null +++ b/metagpt/ext/android_assistant/utils/__init__.py @@ -0,0 +1,3 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : diff --git a/metagpt/ext/android_assistant/utils/schema.py b/metagpt/ext/android_assistant/utils/schema.py new 
file mode 100644 index 0000000000..c066f98b62 --- /dev/null +++ b/metagpt/ext/android_assistant/utils/schema.py @@ -0,0 +1,158 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : + +from enum import Enum + +from pydantic import BaseModel, Field, field_validator + + +class ActionOp(Enum): + TAP = "tap" + LONG_PRESS = "long_press" + TEXT = "text" + SWIPE = "swipe" + VERTICAL_SWIPE = "v_swipe" + HORIZONTAL_SWIPE = "h_swipe" + GRID = "grid" + STOP = "stop" + + +class SwipeOp(Enum): + UP = "up" + DOWN = "down" + LEFT = "left" + RIGHT = "right" + + +class Decision(Enum): + BACK = "BACK" + INEFFECTIVE = "INEFFECTIVE" + CONTINUE = "CONTINUE" + SUCCESS = "SUCCESS" + + @classmethod + def values(cls): + return [item.value for item in cls] + + +class AndroidElement(BaseModel): + """UI Element""" + + uid: str = Field(default="") + bbox: tuple[tuple[int, int], tuple[int, int]] = Field(default=((0, 0), (0, 0))) + attrib: str = Field(default="") + + +class OpLogItem(BaseModel): + """log content for self-learn or task act""" + + step: int = Field(default=0) + prompt: str = Field(default="") + image: str = Field(default="") + response: str = Field(default="") + + +class ReflectLogItem(BaseModel): + """log content for self-learn-reflect""" + + step: int = Field(default=0) + prompt: str = Field(default="") + image_before: str = Field(default="") + image_after: str = Field(default="") + response: str = Field(default="") + + +class RecordLogItem(BaseModel): + """log content for record parse, same as ReflectLogItem""" + + step: int = Field(default=0) + prompt: str = Field(default="") + image_before: str = Field(default="") + image_after: str = Field(default="") + response: str = Field(default="") + + +class DocContent(BaseModel): + tap: str = Field(default="") + text: str = Field(default="") + v_swipe: str = Field(default="") + h_swipe: str = Field(default="") + long_press: str = Field(default="") + + +# start =================== define different Action Op and its params ============= +class RunState(Enum): + """run state""" + + SUCCESS = "success" + FINISH = "finish" + FAIL = "fail" + + +class BaseOpParam(BaseModel): + act_name: str = Field(default="", validate_default=True) + last_act: str = Field(default="None") + param_state: RunState = Field(default=RunState.SUCCESS, description="return state when extract params") + + +class TapOpParam(BaseOpParam): + area: int = Field(default=-1) + + +class TextOpParam(BaseOpParam): + input_str: str = Field(default="") + + +class LongPressOpParam(BaseOpParam): + area: int = Field(default=-1) + + +# TODO: find a clearer name for SwipeOpParam +class SwipeOpParam(BaseOpParam): + area: int = Field(default=-1) + swipe_orient: str = Field(default="up") + dist: str = Field(default="") + + +class GridOpParam(BaseOpParam): + act_name: str = Field(default="") + + +class BaseGridOpParam(BaseOpParam): + @field_validator("act_name", mode="before") + @classmethod + def check_act_name(cls, act_name: str) -> str: + return f"{act_name}_grid" + + +class TapGridOpParam(BaseGridOpParam): + area: int = Field(default=-1) + subarea: str = Field(default="") + + +class LongPressGridOpParam(BaseGridOpParam): + area: int = Field(default=-1) + subarea: str = Field(default="") + + +class SwipeGridOpParam(BaseGridOpParam): + start_area: int = Field(default=-1) + start_subarea: str = Field(default="") + end_area: int = Field(default=-1) + end_subarea: str = Field(default="") + + +# end =================== define different Action Op and its params ============= + + +class ReflectOp(BaseModel): + 
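"""Parsed result of the reflection step, mirroring the SelfLearnReflect ActionNode fields (Decision / Thought / Documentation).""" +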
decision: str = "" + thought: str = "" + documentation: str = "" + param_state: RunState = RunState.SUCCESS + + +class AndroidActionOutput(BaseModel): + data: dict = Field(default=dict()) + action_state: RunState = Field(default=RunState.SUCCESS) diff --git a/metagpt/ext/android_assistant/utils/utils.py b/metagpt/ext/android_assistant/utils/utils.py new file mode 100644 index 0000000000..f1fa138692 --- /dev/null +++ b/metagpt/ext/android_assistant/utils/utils.py @@ -0,0 +1,329 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : + +import re +from pathlib import Path +from typing import Union +from xml.etree.ElementTree import Element, iterparse + +import cv2 +import pyshine as ps + +from metagpt.config2 import config +from metagpt.ext.android_assistant.utils.schema import ( + ActionOp, + AndroidElement, + BaseGridOpParam, + BaseOpParam, + Decision, + GridOpParam, + LongPressGridOpParam, + LongPressOpParam, + ReflectOp, + RunState, + SwipeGridOpParam, + SwipeOpParam, + TapGridOpParam, + TapOpParam, + TextOpParam, +) +from metagpt.logs import logger + + +def get_id_from_element(elem: Element) -> str: + bounds = elem.attrib["bounds"][1:-1].split("][") + x1, y1 = map(int, bounds[0].split(",")) + x2, y2 = map(int, bounds[1].split(",")) + elem_w, elem_h = x2 - x1, y2 - y1 + if "resource-id" in elem.attrib and elem.attrib["resource-id"]: + elem_id = elem.attrib["resource-id"].replace(":", ".").replace("/", "_") + else: + elem_id = f"{elem.attrib['class']}_{elem_w}_{elem_h}" + if "content-desc" in elem.attrib and elem.attrib["content-desc"] and len(elem.attrib["content-desc"]) < 20: + content_desc = elem.attrib["content-desc"].replace("/", "_").replace(" ", "").replace(":", "_") + elem_id += f"_{content_desc}" + return elem_id + + +def traverse_xml_tree(xml_path: Path, elem_list: list[AndroidElement], attrib: str, add_index=False): + path = [] + extra_config = config.extra + for event, elem in iterparse(str(xml_path), ["start", "end"]): + if event == "start": + path.append(elem) + if attrib in elem.attrib and elem.attrib[attrib] == "true": + parent_prefix = "" + if len(path) > 1: + parent_prefix = get_id_from_element(path[-2]) + bounds = elem.attrib["bounds"][1:-1].split("][") + x1, y1 = map(int, bounds[0].split(",")) + x2, y2 = map(int, bounds[1].split(",")) + center = (x1 + x2) // 2, (y1 + y2) // 2 + elem_id = get_id_from_element(elem) + if parent_prefix: + elem_id = parent_prefix + "_" + elem_id + if add_index: + elem_id += f"_{elem.attrib['index']}" + close = False + for e in elem_list: + bbox = e.bbox + center_ = (bbox[0][0] + bbox[1][0]) // 2, (bbox[0][1] + bbox[1][1]) // 2 + dist = (abs(center[0] - center_[0]) ** 2 + abs(center[1] - center_[1]) ** 2) ** 0.5 + if dist <= extra_config.get("min_dist", 30): + close = True + break + if not close: + elem_list.append(AndroidElement(uid=elem_id, bbox=((x1, y1), (x2, y2)), attrib=attrib)) + + if event == "end": + path.pop() + + +def elem_list_from_xml_tree(xml_path: Path, useless_list: list[str], min_dist: int) -> list[AndroidElement]: + clickable_list = [] + focusable_list = [] + traverse_xml_tree(xml_path, clickable_list, "clickable", True) + traverse_xml_tree(xml_path, focusable_list, "focusable", True) + elem_list = [] + for elem in clickable_list: + if elem.uid in useless_list: + continue + elem_list.append(elem) + for elem in focusable_list: + if elem.uid in useless_list: + continue + bbox = elem.bbox + center = (bbox[0][0] + bbox[1][0]) // 2, (bbox[0][1] + bbox[1][1]) // 2 + close = False + for e in clickable_list: + bbox = e.bbox + 
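# compare centers: a focusable element whose center lies within min_dist of an already-kept clickable element is treated as a duplicate hit target +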
center_ = (bbox[0][0] + bbox[1][0]) // 2, (bbox[0][1] + bbox[1][1]) // 2 + dist = (abs(center[0] - center_[0]) ** 2 + abs(center[1] - center_[1]) ** 2) ** 0.5 + if dist <= min_dist: + close = True + break + if not close: + elem_list.append(elem) + return elem_list + + +def draw_bbox_multi( + img_path: Path, + output_path: Path, + elem_list: list[AndroidElement], + record_mode: bool = False, + dark_mode: bool = False, +): + imgcv = cv2.imread(str(img_path)) + count = 1 + for elem in elem_list: + try: + top_left = elem.bbox[0] + bottom_right = elem.bbox[1] + left, top = top_left[0], top_left[1] + right, bottom = bottom_right[0], bottom_right[1] + label = str(count) + if record_mode: + if elem.attrib == "clickable": + color = (250, 0, 0) + elif elem.attrib == "focusable": + color = (0, 0, 250) + else: + color = (0, 250, 0) + imgcv = ps.putBText( + imgcv, + label, + text_offset_x=(left + right) // 2 + 10, + text_offset_y=(top + bottom) // 2 + 10, + vspace=10, + hspace=10, + font_scale=1, + thickness=2, + background_RGB=color, + text_RGB=(255, 250, 250), + alpha=0.5, + ) + else: + text_color = (10, 10, 10) if dark_mode else (255, 250, 250) + bg_color = (255, 250, 250) if dark_mode else (10, 10, 10) + imgcv = ps.putBText( + imgcv, + label, + text_offset_x=(left + right) // 2 + 10, + text_offset_y=(top + bottom) // 2 + 10, + vspace=10, + hspace=10, + font_scale=1, + thickness=2, + background_RGB=bg_color, + text_RGB=text_color, + alpha=0.5, + ) + except Exception as e: + logger.error(f"ERROR: An exception occurs while labeling the image\n{e}") + count += 1 + cv2.imwrite(str(output_path), imgcv) + return imgcv + + +def draw_grid(img_path: Path, output_path: Path) -> tuple[int, int]: + def get_unit_len(n): + for i in range(1, n + 1): + if n % i == 0 and 120 <= i <= 180: + return i + return -1 + + image = cv2.imread(str(img_path)) + height, width, _ = image.shape + color = (255, 116, 113) + unit_height = get_unit_len(height) + if unit_height < 0: + unit_height = 120 + unit_width = get_unit_len(width) + if unit_width < 0: + unit_width = 120 + thick = int(unit_width // 50) + rows = height // unit_height + cols = width // unit_width + for i in range(rows): + for j in range(cols): + label = i * cols + j + 1 + left = int(j * unit_width) + top = int(i * unit_height) + right = int((j + 1) * unit_width) + bottom = int((i + 1) * unit_height) + cv2.rectangle(image, (left, top), (right, bottom), color, thick // 2) + cv2.putText( + image, + str(label), + (left + int(unit_width * 0.05) + 3, top + int(unit_height * 0.3) + 3), + 0, + int(0.01 * unit_width), + (0, 0, 0), + thick, + ) + cv2.putText( + image, + str(label), + (left + int(unit_width * 0.05), top + int(unit_height * 0.3)), + 0, + int(0.01 * unit_width), + color, + thick, + ) + cv2.imwrite(str(output_path), image) + return rows, cols + + +def area_to_xy(area: int, subarea: str, width: int, height: int, rows: int, cols: int) -> tuple[int, int]: + area -= 1 + row, col = area // cols, area % cols + x_0, y_0 = col * (width // cols), row * (height // rows) + if subarea == "top-left": + x, y = x_0 + (width // cols) // 4, y_0 + (height // rows) // 4 + elif subarea == "top": + x, y = x_0 + (width // cols) // 2, y_0 + (height // rows) // 4 + elif subarea == "top-right": + x, y = x_0 + (width // cols) * 3 // 4, y_0 + (height // rows) // 4 + elif subarea == "left": + x, y = x_0 + (width // cols) // 4, y_0 + (height // rows) // 2 + elif subarea == "right": + x, y = x_0 + (width // cols) * 3 // 4, y_0 + (height // rows) // 2 + elif subarea == "bottom-left": + x, y = 
x_0 + (width // cols) // 4, y_0 + (height // rows) * 3 // 4 + elif subarea == "bottom": + x, y = x_0 + (width // cols) // 2, y_0 + (height // rows) * 3 // 4 + elif subarea == "bottom-right": + x, y = x_0 + (width // cols) * 3 // 4, y_0 + (height // rows) * 3 // 4 + else: + x, y = x_0 + (width // cols) // 2, y_0 + (height // rows) // 2 + return x, y + + +def elem_bbox_to_xy(bbox: tuple[tuple[int, int], tuple[int, int]]) -> tuple[int, int]: + tl, br = bbox + x, y = (tl[0] + br[0]) // 2, (tl[1] + br[1]) // 2 + return x, y + + +def reflect_parse_extarct(parsed_json: dict) -> ReflectOp: + decision = parsed_json.get("Decision") + if decision not in Decision.values(): + op = ReflectOp(param_state=RunState.FAIL) + else: + op = ReflectOp( + decision=parsed_json.get("Decision"), + thought=parsed_json.get("Thought"), + documentation=parsed_json.get("Documentation"), + ) + return op + + +def screenshot_parse_extract( + parsed_json: dict, grid_on: bool = False +) -> Union[BaseOpParam, BaseGridOpParam, GridOpParam]: + act = parsed_json.get("Action") + last_act = parsed_json.get("Summary") + act_name = act.split("(")[0] + + if RunState.FINISH.value.upper() in act: + return BaseOpParam(param_state=RunState.FINISH) + + if grid_on: + return screenshot_parse_extract_with_grid(act_name, act, last_act) + else: + return screenshot_parse_extract_without_grid(act_name, act, last_act) + + +def op_params_clean(params: list[str]) -> list[Union[int, str]]: + param_values = [] + for param_value in params: + if '"' in param_value or "'" in param_value: # remove `"` + param_values.append(param_value.strip()[1:-1]) + else: + param_values.append(int(param_value)) + return param_values + + +def screenshot_parse_extract_without_grid(act_name: str, act: str, last_act: str) -> Union[BaseOpParam, GridOpParam]: + if act_name == ActionOp.TAP.value: + area = int(re.findall(r"tap\((.*?)\)", act)[0]) + op = TapOpParam(act_name=act_name, area=area, last_act=last_act) + elif act_name == ActionOp.TEXT.value: + input_str = re.findall(r"text\((.*?)\)", act)[0][1:-1] + op = TextOpParam(act_name=act_name, input_str=input_str, last_act=last_act) + elif act_name == ActionOp.LONG_PRESS.value: + area = int(re.findall(r"long_press\((.*?)\)", act)[0]) + op = LongPressOpParam(act_name=act_name, area=area, last_act=last_act) + elif act_name == ActionOp.SWIPE.value: + params = re.findall(r"swipe\((.*?)\)", act)[0].split(",") + params = op_params_clean(params) # area, swipe_orient, dist + op = SwipeOpParam(act_name=act_name, area=params[0], swipe_orient=params[1], dist=params[2], last_act=last_act) + elif act_name == ActionOp.GRID.value: + op = GridOpParam(act_name=act_name) + else: + op = BaseOpParam(param_state=RunState.FAIL) + return op + + +def screenshot_parse_extract_with_grid(act_name: str, act: str, last_act: str) -> Union[BaseGridOpParam, GridOpParam]: + if act_name == ActionOp.TAP.value: + params = re.findall(r"tap\((.*?)\)", act)[0].split(",") + params = op_params_clean(params) + op = TapGridOpParam(act_name=act_name, area=params[0], subarea=params[1], last_act=last_act) + elif act_name == ActionOp.LONG_PRESS.value: + params = re.findall(r"long_press\((.*?)\)", act)[0].split(",") + params = op_params_clean(params) + op = LongPressGridOpParam(act_name=act_name, area=params[0], subarea=params[1], last_act=last_act) + elif act_name == ActionOp.SWIPE.value: + params = re.findall(r"swipe\((.*?)\)", act)[0].split(",") + params = op_params_clean(params) + op = SwipeGridOpParam( + act_name=act_name, start_area=params[0], start_subarea=params[1], 
end_area=params[2], end_subarea=params[3] + ) + elif act_name == ActionOp.GRID.value: + op = GridOpParam(act_name=act_name) + else: + op = BaseGridOpParam(param_state=RunState.FAIL) + return op diff --git a/metagpt/ext/stanford_town/README.md b/metagpt/ext/stanford_town/README.md new file mode 100644 index 0000000000..1bdcac145f --- /dev/null +++ b/metagpt/ext/stanford_town/README.md @@ -0,0 +1,51 @@ +## Stanford Town Game + +### Preliminaries +To let the GA ([generative_agents](https://github.com/joonspk-research/generative_agents)) frontend consume the simulation data without changing its code, set `temp_storage_path` to the `temp_storage` path of `generative_agents` when starting `run_st_game.py`, like + +`python3 run_st_game.py --temp_storage_path path/to/ga/temp_storage xxx` + +Or change the paths in `const.py` as below + +``` +STORAGE_PATH = EXAMPLE_PATH.joinpath("storage") +TEMP_STORAGE_PATH = EXAMPLE_PATH.joinpath("temp_storage") +# updated +STORAGE_PATH = Path("{path/to/ga/storage}") +TEMP_STORAGE_PATH = Path("{path/to/ga/temp_storage}") +``` + +This connects the simulation data to GA without changing the GA code; otherwise, the GA code would have to be modified to match the MetaGPT output path. + +If you don't want to start from scratch, copy one of the simulation directories under `generative_agents/environment/frontend_server/storage/` to `examples/stanford_town/storage`, and use its directory name as the `fork_sim_code`. + +### Backend service startup +The entry point is `python3 run_st_game.py "Host a open lunch party at 13:00 pm" "base_the_ville_isabella_maria_klaus" "test_sim" 10` +or +`python3 run_st_game.py "Host a open lunch party at 13:00 pm" "base_the_ville_isabella_maria_klaus" "test_sim" 10 --temp_storage_path path/to/ga/temp_storage` + +`idea` is the user's message to the first agent; it propagates from that agent through the town, so you can check whether the multi-agent simulation ultimately achieves the goal of hosting or participating in the event. + +### Frontend service startup +Enter the project folder `generative_agents`. + +Enter `environment/frontend_server` and use `python3 manage.py runserver` to start the frontend service. +Visit `http://localhost:8000/simulator_home` to see the current simulation. + +## Acknowledgements +This reproduction draws on [generative_agents](https://github.com/joonspk-research/generative_agents); we thank the original authors. + +### Citation +```bib +@inproceedings{Park2023GenerativeAgents, +author = {Park, Joon Sung and O'Brien, Joseph C. 
and Morris, Meredith Ringel and Liang, Percy and Bernstein, Michael S.}, +title = {Generative Agents: Interactive Simulacra of Human Behavior}, +year = {2023}, +publisher = {Association for Computing Machinery}, +address = {New York, NY, USA}, +booktitle = {In the 36th Annual ACM Symposium on User Interface Software and Technology (UIST '23)}, +keywords = {Human-AI interaction, agents, generative AI, large language models}, +location = {San Francisco, CA, USA}, +series = {UIST '23} +} +``` \ No newline at end of file diff --git a/metagpt/ext/stanford_town/README_CN.md b/metagpt/ext/stanford_town/README_CN.md new file mode 100644 index 0000000000..3daf68d08f --- /dev/null +++ b/metagpt/ext/stanford_town/README_CN.md @@ -0,0 +1,50 @@ +## Stanford Town Game + +### 前置 +为了方便GA( [generative_agents](https://github.com/joonspk-research/generative_agents) )的前端对接数据(避免改动它那块的代码),可在启动`run_st_game.py`加上`temp_storage_path`指向`generative_agents`对应的`temp_storage`路径。比如 + +`python3 run_st_game.py --temp_storage_path path/to/ga/temp_storage xxx` + +或将`const.py`下的 + +``` +STORAGE_PATH = EXAMPLE_PATH.joinpath("storage") +TEMP_STORAGE_PATH = EXAMPLE_PATH.joinpath("temp_storage") +# 更新为 +STORAGE_PATH = Path("{path/to/ga/storage}") +TEMP_STORAGE_PATH = Path("{path/to/ga/temp_storage}") +``` +这样可用实现不改变GA代码情况下,实现仿真数据的对接。不然得修改GA的代码来适配MG的输出路径。 + +如果你不想从0开始启动,拷贝`generative_agents/environment/frontend_server/storage/`下的其他仿真目录到`examples/stanford_town/storage`,并选择一个目录名作为`fork_sim_code`。 + +### 后端服务启动 +执行入口为:`python3 run_st_game.py "Host a open lunch party at 13:00 pm" "base_the_ville_isabella_maria_klaus" "test_sim" 10` +或者 +`python3 run_st_game.py "Host a open lunch party at 13:00 pm" "base_the_ville_isabella_maria_klaus" "test_sim" 10 --temp_storage_path path/to/ga/temp_storage` + +`idea`为用户给第一个Agent的用户心声,并通过这个心声进行传播,看最后多智能体是否达到举办、参加活动的目标。 + +### 前端服务启动 +进入`generative_agents`项目目录 + +进入`environment/frontend_server`,使用`python3 manage.py runserver`启动前端服务。 +访问`http://localhost:8000/simulator_home` 进入当前的仿真界面。 + +## 致谢 +复现工作参考了 [generative_agents](https://github.com/joonspk-research/generative_agents), 感谢相关作者们。 + +### 引用 +```bib +@inproceedings{Park2023GenerativeAgents, +author = {Park, Joon Sung and O'Brien, Joseph C. and Cai, Carrie J. 
and Morris, Meredith Ringel and Liang, Percy and Bernstein, Michael S.}, +title = {Generative Agents: Interactive Simulacra of Human Behavior}, +year = {2023}, +publisher = {Association for Computing Machinery}, +address = {New York, NY, USA}, +booktitle = {In the 36th Annual ACM Symposium on User Interface Software and Technology (UIST '23)}, +keywords = {Human-AI interaction, agents, generative AI, large language models}, +location = {San Francisco, CA, USA}, +series = {UIST '23} +} +``` diff --git a/metagpt/ext/stanford_town/__init__.py b/metagpt/ext/stanford_town/__init__.py new file mode 100644 index 0000000000..56ea35c9f7 --- /dev/null +++ b/metagpt/ext/stanford_town/__init__.py @@ -0,0 +1,3 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : stanford town implementation diff --git a/metagpt/ext/stanford_town/actions/__init__.py b/metagpt/ext/stanford_town/actions/__init__.py new file mode 100644 index 0000000000..2bcf8efd09 --- /dev/null +++ b/metagpt/ext/stanford_town/actions/__init__.py @@ -0,0 +1,3 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : diff --git a/metagpt/ext/stanford_town/actions/agent_chat_sum_rel.py b/metagpt/ext/stanford_town/actions/agent_chat_sum_rel.py new file mode 100644 index 0000000000..98d370bb07 --- /dev/null +++ b/metagpt/ext/stanford_town/actions/agent_chat_sum_rel.py @@ -0,0 +1,39 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : summarize the relationship in an agent chat + +from metagpt.ext.stanford_town.actions.st_action import STAction +from metagpt.logs import logger + + +class AgentChatSumRel(STAction): + name: str = "AgentChatSumRel" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + resp = False + try: + _ = llm_resp.split('"')[0].strip() + resp = True + except Exception: + pass + return resp + + def _func_cleanup(self, llm_resp: str, prompt: str) -> str: + return llm_resp.split('"')[0].strip() + + def _func_fail_default_resp(self) -> str: + pass + + async def run(self, init_role: "STRole", target_role: "STRole", statements: str) -> str: + def create_prompt_input(init_role: "STRole", target_role: "STRole", statements: str) -> list: + prompt_input = [statements, init_role.name, target_role.name] + return prompt_input + + prompt_input = create_prompt_input(init_role, target_role, statements) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "summarize_chat_relationship_v2.txt") + + example_output = "Jane Doe is working on a project" + special_instruction = "The output should be a string that responds to the question." 
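+        # Assumption: STAction._run_gpt35 builds the final request from (prompt, example_output, special_instruction), then applies _func_validate/_func_cleanup to the raw response, falling back to fail_default_resp when validation keeps failing.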
+ output = await self._run_gpt35(prompt, example_output, special_instruction) + logger.info(f"Role: {init_role.name} Action: {self.cls_name} output: {output}") + return output diff --git a/metagpt/ext/stanford_town/actions/decide_to_talk.py b/metagpt/ext/stanford_town/actions/decide_to_talk.py new file mode 100644 index 0000000000..a393f31af7 --- /dev/null +++ b/metagpt/ext/stanford_town/actions/decide_to_talk.py @@ -0,0 +1,97 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : decide whether to talk to another role, return yes or no + +from metagpt.ext.stanford_town.actions.st_action import STAction +from metagpt.logs import logger + + +class DecideToTalk(STAction): + name: str = "DecideToTalk" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + resp = False + try: + if llm_resp.split("Answer in yes or no:")[-1].strip().lower() in ["yes", "no"]: + resp = True + except ValueError: + pass + return resp + + def _func_cleanup(self, llm_resp: str, prompt: str) -> str: + return llm_resp.split("Answer in yes or no:")[-1].strip().lower() + + def _func_fail_default_resp(self) -> str: + return "yes" + + async def run(self, init_role: "STRole", target_role: "STRole", retrieved: dict, *args, **kwargs) -> bool: + """Run action""" + + def create_prompt_input(init_role: "STRole", target_role: "STRole", retrieved: dict) -> list: + scratch = init_role.rc.scratch + target_scratch = target_role.rc.scratch + last_chat = init_role.rc.memory.get_last_chat(target_role.name) + last_chatted_time = "" + last_chat_about = "" + if last_chat: + last_chatted_time = last_chat.created.strftime("%B %d, %Y, %H:%M:%S") + last_chat_about = last_chat.description + + context = "" + for c_node in retrieved["events"]: + curr_desc = c_node.description.split(" ") + curr_desc[2:3] = ["was"] + curr_desc = " ".join(curr_desc) + context += f"{curr_desc}. " + context += "\n" + for c_node in retrieved["thoughts"]: + context += f"{c_node.description}. 
" + + curr_time = scratch.curr_time.strftime("%B %d, %Y, %H:%M:%S %p") + init_act_desc = scratch.act_description + if "(" in init_act_desc: + init_act_desc = init_act_desc.split("(")[-1][:-1] + + if len(scratch.planned_path) == 0 and "waiting" not in init_act_desc: + init_p_desc = f"{init_role.name} is already {init_act_desc}" + elif "waiting" in init_act_desc: + init_p_desc = f"{init_role.name} is {init_act_desc}" + else: + init_p_desc = f"{init_role.name} is on the way to {init_act_desc}" + + target_act_desc = target_scratch.act_description + if "(" in target_act_desc: + target_act_desc = target_act_desc.split("(")[-1][:-1] + + if len(target_scratch.planned_path) == 0 and "waiting" not in target_act_desc: + target_p_desc = f"{target_role.name} is already {target_act_desc}" + elif "waiting" in target_act_desc: + target_p_desc = f"{target_role.name} is {target_act_desc}" + else: + target_p_desc = f"{target_role.name} is on the way to {target_act_desc}" + + prompt_input = [] + prompt_input += [context] + + prompt_input += [curr_time] + + prompt_input += [init_role.name] + prompt_input += [target_role.name] + prompt_input += [last_chatted_time] + prompt_input += [last_chat_about] + + prompt_input += [init_p_desc] + prompt_input += [target_p_desc] + prompt_input += [init_role.name] + prompt_input += [target_role.name] + return prompt_input + + prompt_input = create_prompt_input(init_role, target_role, retrieved) + prompt = self.generate_prompt_with_tmpl_filename( + prompt_input=prompt_input, tmpl_filename="decide_to_talk_v2.txt" + ) + self.fail_default_resp = self._func_fail_default_resp() + output = await self._run_gpt35_max_tokens(prompt, max_tokens=20) # yes or no + result = output == "yes" + logger.info(f"Role: {init_role.name} Action: {self.cls_name} output: {result}") + return result diff --git a/metagpt/ext/stanford_town/actions/dummy_action.py b/metagpt/ext/stanford_town/actions/dummy_action.py new file mode 100644 index 0000000000..a5004d5ef3 --- /dev/null +++ b/metagpt/ext/stanford_town/actions/dummy_action.py @@ -0,0 +1,20 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : dummy action so that every STRole can handle the DummyMessage produced by DummyAction + +from metagpt.actions import Action +from metagpt.schema import Message + + +class DummyAction(Action): + async def run(self, *args, **kwargs): + raise NotImplementedError + + +class DummyMessage(Message): + """ + dummy message passed to roles so that each of them executes every round + """ + + content: str = "dummy" + cause_by: str = "DummyAction" diff --git a/metagpt/ext/stanford_town/actions/gen_action_details.py b/metagpt/ext/stanford_town/actions/gen_action_details.py new file mode 100644 index 0000000000..8e268a723a --- /dev/null +++ b/metagpt/ext/stanford_town/actions/gen_action_details.py @@ -0,0 +1,401 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : gen_action_details + +import random + +from metagpt.environment.stanford_town.env_space import EnvObsParams, EnvObsType +from metagpt.ext.stanford_town.actions.st_action import STAction +from metagpt.logs import logger + + +class GenActionSector(STAction): + name: str = "GenActionSector" + + def _func_cleanup(self, llm_resp: str, prompt: str): + cleaned_response = llm_resp.split("}")[0] + return cleaned_response + + def _func_validate(self, llm_resp: str, prompt: str): + if len(llm_resp.strip()) < 1: + return False + if "}" not in llm_resp: + return False + if "," in llm_resp: + return False + return True + + def 
_func_fail_default_resp(self): + fs = "kitchen" + return fs + + async def run(self, role: "STRole", access_tile: dict[str, str], act_desp: str): + def create_prompt_input(role, access_tile: dict[str, str], act_desp): + act_world = f"{access_tile['world']}" + + prompt_input = [] + + prompt_input += [role.scratch.get_str_name()] + prompt_input += [role.scratch.living_area.split(":")[1]] + x = f"{act_world}:{role.scratch.living_area.split(':')[1]}" + prompt_input += [role.s_mem.get_str_accessible_sector_arenas(x)] + + prompt_input += [role.scratch.get_str_name()] + prompt_input += [f"{access_tile['sector']}"] + x = f"{act_world}:{access_tile['sector']}" + prompt_input += [role.s_mem.get_str_accessible_sector_arenas(x)] + + if role.scratch.get_str_daily_plan_req() != "": + prompt_input += [f"\n{role.scratch.get_str_daily_plan_req()}"] + else: + prompt_input += [""] + + # MAR 11 TEMP + prompt_input = [] + act_world = access_tile["world"] + accessible_sector_str = role.s_mem.get_str_accessible_sectors(act_world) + curr = accessible_sector_str.split(", ") + fin_accessible_sectors = [] + for i in curr: + if "'s house" in i: + if role.scratch.last_name in i: + fin_accessible_sectors += [i] + else: + fin_accessible_sectors += [i] + accessible_sector_str = ", ".join(fin_accessible_sectors) + # END MAR 11 TEMP + + prompt_input += [accessible_sector_str] + + act_desp_1 = act_desp + act_desp_2 = act_desp + if "(" in act_desp: + act_desp_1 = act_desp.split("(")[0].strip() + act_desp_2 = act_desp.split("(")[-1][:-1] + prompt_input += [role.scratch.get_str_name()] + prompt_input += [act_desp_1] + + prompt_input += [act_desp_2] + prompt_input += [role.scratch.get_str_name()] + return prompt_input + + prompt_template = "action_location_sector_v1.txt" + prompt_input = create_prompt_input(role, access_tile, act_desp) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, prompt_template) + + self.fail_default_resp = self._func_fail_default_resp() + output = await self._run_gpt35_max_tokens(prompt, max_tokens=15) + y = f"{access_tile['world']}" + x = [i.strip() for i in role.s_mem.get_str_accessible_sectors(y).split(",")] + if output not in x: + # output = random.choice(x) + output = role.scratch.living_area.split(":")[1] + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +class GenActionArena(STAction): + name: str = "GenActionArena" + + def _func_cleanup(self, llm_resp: str, prompt: str): + cleaned_response = llm_resp.split("}")[0] + return cleaned_response + + def _func_validate(self, llm_resp: str, prompt: str): + if len(llm_resp.strip()) < 1: + return False + if "}" not in llm_resp: + return False + if "," in llm_resp: + return False + return True + + def _func_fail_default_resp(self): + fs = "kitchen" + return fs + + async def run(self, role: "STRole", act_desp: str, act_world: str, act_sector: str): + def create_prompt_input(role, act_desp, act_world, act_sector): + prompt_input = [] + prompt_input += [role.scratch.get_str_name()] + x = f"{act_world}:{act_sector}" + prompt_input += [act_sector] + + # MAR 11 TEMP + accessible_arena_str = role.s_mem.get_str_accessible_sector_arenas(x) + curr = accessible_arena_str.split(", ") + fin_accessible_arenas = [] + for i in curr: + if "'s room" in i: + if role.scratch.last_name in i: + fin_accessible_arenas += [i] + else: + fin_accessible_arenas += [i] + accessible_arena_str = ", ".join(fin_accessible_arenas) + # END MAR 11 TEMP + prompt_input += [accessible_arena_str] + act_desp_1 = act_desp + act_desp_2 = 
act_desp + if "(" in act_desp: + act_desp_1 = act_desp.split("(")[0].strip() + act_desp_2 = act_desp.split("(")[-1][:-1] + prompt_input += [role.scratch.get_str_name()] + prompt_input += [act_desp_1] + + prompt_input += [act_desp_2] + prompt_input += [role.scratch.get_str_name()] + + prompt_input += [act_sector] + prompt_input += [accessible_arena_str] + return prompt_input + + prompt_template = "action_location_object_vMar11.txt" + prompt_input = create_prompt_input(role, act_desp, act_world, act_sector) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, prompt_template) + self.fail_default_resp = self._func_fail_default_resp() + output = await self._run_gpt35_max_tokens(prompt, max_tokens=15) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +class GenActionObject(STAction): + name: str = "GenActionObject" + + def _func_validate(self, llm_resp: str, prompt: str): + if len(llm_resp.strip()) < 1: + return False + return True + + def _func_cleanup(self, llm_resp: str, prompt: str): + cleaned_response = llm_resp.strip() + return cleaned_response + + def _func_fail_default_resp(self): + fs = "bed" + return fs + + async def run(self, role: "STRole", act_desp: str, temp_address: str): + def create_prompt_input(role, act_desp, temp_address): + prompt_input = [] + if "(" in act_desp: + act_desp = act_desp.split("(")[-1][:-1] + + prompt_input += [act_desp] + prompt_input += [role.s_mem.get_str_accessible_arena_game_objects(temp_address)] + return prompt_input + + prompt_template = "action_object_v2.txt" + prompt_input = create_prompt_input(role, act_desp, temp_address) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, prompt_template) + self.fail_default_resp = self._func_fail_default_resp() + output = await self._run_gpt35_max_tokens(prompt, max_tokens=15) + x = [i.strip() for i in role.s_mem.get_str_accessible_arena_game_objects(temp_address).split(",")] + if output not in x: + output = random.choice(x) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +class GenPronunciatio(STAction): + name: str = "GenPronunciatio" + + def _func_cleanup(self, llm_resp: str, prompt: str): + cr = llm_resp.strip() + if len(cr) > 3: + cr = cr[:3] + return cr + + def _func_validate(self, llm_resp: str, prompt: str): + try: + self._func_cleanup(llm_resp, prompt="") + if len(llm_resp) == 0: + return False + except Exception: + return False + return True + + def _func_fail_default_resp(self): + fs = "😋" + return fs + + async def run(self, role: "STRole", act_desp: str): + def create_prompt_input(act_desp): + if "(" in act_desp: + act_desp = act_desp.split("(")[-1].split(")")[0] + prompt_input = [act_desp] + return prompt_input + + prompt_template = "generate_pronunciatio_v1.txt" + prompt_input = create_prompt_input(act_desp) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, prompt_template) + example_output = "🛁🧖‍♀️" + special_instruction = "The value for the output must ONLY contain the emojis." 
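+        # _func_cleanup above keeps at most the first 3 characters of the reply, so an over-long emoji answer still validates.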
+ self.fail_default_resp = self._func_fail_default_resp() + output = await self._run_gpt35(prompt, example_output, special_instruction) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +class GenEventTriple(STAction): + name: str = "GenEventTriple" + + def _func_cleanup(self, llm_resp: str, prompt: str): + cr = llm_resp.strip() + cr = [i.strip() for i in cr.split(")")[0].split(",")] + return cr + + def _func_validate(self, llm_resp: str, prompt: str): + try: + llm_resp = self._func_cleanup(llm_resp, prompt="") + if len(llm_resp) != 2: + return False + except Exception: + return False + return True + + def _func_fail_default_resp(self, role): + fs = (role.name, "is", "idle") + return fs + + async def run(self, role: "STRole", act_desp: str): + def create_prompt_input(role, act_desp): + if "(" in act_desp: + act_desp = act_desp.split("(")[-1].split(")")[0] + prompt_input = [role.name, act_desp, role.name] + return prompt_input + + prompt_template = "generate_event_triple_v1.txt" + prompt_input = create_prompt_input(role, act_desp) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, prompt_template) + self.fail_default_resp = self._func_fail_default_resp(role) + output = await self._run_gpt35_max_tokens(prompt, max_tokens=30) + output = (role.name, output[0], output[1]) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +class GenActObjDescription(STAction): + name: str = "GenActObjDescription" + + def _func_cleanup(self, llm_resp: str, prompt: str): + cr = llm_resp.strip() + if cr[-1] == ".": + cr = cr[:-1] + return cr + + def _func_validate(self, llm_resp: str, prompt: str): + try: + llm_resp = self._func_cleanup(llm_resp, prompt="") + except Exception: + return False + return True + + def _func_fail_default_resp(self, act_game_object): + fs = f"{act_game_object} is idle" + return fs + + async def run(self, role: "STRole", act_game_object: str, act_desp: str): + def create_prompt_input(act_game_object, act_desp, role): + prompt_input = [act_game_object, role.name, act_desp, act_game_object, act_game_object] + return prompt_input + + prompt_template = "generate_obj_event_v1.txt" + prompt_input = create_prompt_input(act_game_object, act_desp, role) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, prompt_template) + example_output = "being fixed" + special_instruction = "The output should ONLY contain the phrase that should go in ." 
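+        # If the response never validates, the default "{act_game_object} is idle" keeps downstream object events well-formed.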
+ self.fail_default_resp = self._func_fail_default_resp(act_game_object) + output = await self._run_gpt35(prompt, example_output, special_instruction) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +class GenObjEventTriple(STAction): + name: str = "GenObjEventTriple" + + def _func_cleanup(self, llm_resp: str, prompt: str): + cr = llm_resp.strip() + cr = [i.strip() for i in cr.split(")")[0].split(",")] + return cr + + def _func_validate(self, llm_resp: str, prompt: str): + try: + llm_resp = self._func_cleanup(llm_resp, prompt="") + if len(llm_resp) != 2: + return False + except Exception: + return False + return True + + def _func_fail_default_resp(self, act_game_object: str): + fs = (act_game_object, "is", "idle") + return fs + + async def run(self, role: "STRole", act_game_object, act_obj_desp): + def create_prompt_input(act_game_object, act_obj_desp): + prompt_input = [act_game_object, act_obj_desp, act_game_object] + return prompt_input + + prompt_template = "generate_event_triple_v1.txt" + prompt_input = create_prompt_input(act_game_object, act_obj_desp) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, prompt_template) + self.fail_default_resp = self._func_fail_default_resp(act_game_object) + output = await self._run_gpt35_max_tokens(prompt, max_tokens=30) + output = (act_game_object, output[0], output[1]) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +class GenActionDetails(STAction): + name: str = "GenActionDetails" + + def _func_cleanup(self, llm_resp: str, prompt: str) -> list: + pass + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + # TODO -- this sometimes generates error + try: + self._func_cleanup(llm_resp) + except Exception: + return False + return True + + def _func_fail_default_resp(self): + fs = {} + return fs + + async def run(self, role: "STRole", act_desp: str, act_dura): + access_tile = role.rc.env.observe( + obs_params=EnvObsParams(obs_type=EnvObsType.GET_TITLE, coord=role.scratch.curr_tile) + ) + act_world = access_tile["world"] + act_sector = await GenActionSector().run(role, access_tile, act_desp) + act_arena = await GenActionArena().run(role, act_desp, act_world, act_sector) + act_address = f"{act_world}:{act_sector}:{act_arena}" + if not role.s_mem.get_str_accessible_arena_game_objects(act_address): + act_game_object = "" + else: + act_game_object = await GenActionObject().run(role, act_desp, act_address) + new_address = f"{act_world}:{act_sector}:{act_arena}:{act_game_object}" + act_pron = await GenPronunciatio().run(role, act_desp) + act_event = await GenEventTriple().run(role, act_desp) + # Persona's actions also influence the object states. We set those up here. 
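+        # Recap of the pipeline above: sector -> arena -> game object narrows the action address ("world:sector:arena:object"); the description then yields an emoji pronunciatio and a (subject, predicate, object) event triple, mirrored below for the object side.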
+ act_obj_desp = await GenActObjDescription().run(role, act_game_object, act_desp) + act_obj_pron = await GenPronunciatio().run(role, act_obj_desp) + act_obj_event = await GenObjEventTriple().run(role, act_game_object, act_obj_desp) + result_dict = { + "action_address": new_address, + "action_duration": int(act_dura), + "action_description": act_desp, + "action_pronunciatio": act_pron, + "action_event": act_event, + "chatting_with": None, + "chat": None, + "chatting_with_buffer": None, + "chatting_end_time": None, + "act_obj_description": act_obj_desp, + "act_obj_pronunciatio": act_obj_pron, + "act_obj_event": act_obj_event, + } + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {result_dict}") + return result_dict diff --git a/metagpt/ext/stanford_town/actions/gen_daily_schedule.py b/metagpt/ext/stanford_town/actions/gen_daily_schedule.py new file mode 100644 index 0000000000..5dffa89952 --- /dev/null +++ b/metagpt/ext/stanford_town/actions/gen_daily_schedule.py @@ -0,0 +1,60 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : gen_daily_schedule + + +from metagpt.ext.stanford_town.actions.st_action import STAction +from metagpt.logs import logger + + +class GenDailySchedule(STAction): + name: str = "GenDailySchedule" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + try: + self._func_cleanup(llm_resp, prompt="") + except Exception: + return False + return True + + def _func_cleanup(self, llm_resp: str, prompt: str) -> list: + cr = [] + _cr = llm_resp.split(")") + for i in _cr: + if i[-1].isdigit(): + i = i[:-1].strip() + if i[-1] == "." or i[-1] == ",": + cr += [i[:-1].strip()] + return cr + + def _func_fail_default_resp(self) -> int: + fs = [ + "wake up and complete the morning routine at 6:00 am", + "eat breakfast at 7:00 am", + "read a book from 8:00 am to 12:00 pm", + "have lunch at 12:00 pm", + "take a nap from 1:00 pm to 4:00 pm", + "relax and watch TV from 7:00 pm to 8:00 pm", + "go to bed at 11:00 pm", + ] + return fs + + async def run(self, role: "STRole", wake_up_hour: str): + def create_prompt_input(role, wake_up_hour): + prompt_input = [] + prompt_input += [role.scratch.get_str_iss()] + prompt_input += [role.scratch.get_str_lifestyle()] + prompt_input += [role.scratch.get_str_curr_date_str()] + prompt_input += [role.scratch.get_str_firstname()] + prompt_input += [f"{str(wake_up_hour)}:00 am"] + return prompt_input + + wake_up_hour = int(wake_up_hour) + prompt_template = "daily_planning_v6.txt" + prompt_input = create_prompt_input(role, wake_up_hour) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, prompt_template) + self.fail_default_resp = self._func_fail_default_resp() + output = await self._run_gpt35_max_tokens(prompt, max_tokens=500) + output = [f"wake up and complete the morning routine at {wake_up_hour}:00 am"] + output + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output diff --git a/metagpt/ext/stanford_town/actions/gen_hourly_schedule.py b/metagpt/ext/stanford_town/actions/gen_hourly_schedule.py new file mode 100644 index 0000000000..5d59f96dda --- /dev/null +++ b/metagpt/ext/stanford_town/actions/gen_hourly_schedule.py @@ -0,0 +1,181 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : gen_hourly_schedule + +import random +import string + +from metagpt.logs import logger + +from .st_action import STAction + + +def get_random_alphanumeric(i=6, j=6): + """ + Returns a random alpha numeric strength that has the length of somewhere + between i and j. 
+
+    INPUT:
+        i: min_range for the length
+        j: max_range for the length
+    OUTPUT:
+        an alphanumeric str with a length somewhere between i and j.
+    """
+    k = random.randint(i, j)
+    x = "".join(random.choices(string.ascii_letters + string.digits, k=k))
+    return x
+
+
+class GenHourlySchedule(STAction):
+    name: str = "GenHourlySchedule"
+
+    def _func_validate(self, llm_resp: str, prompt: str) -> bool:
+        try:
+            self._func_cleanup(llm_resp, prompt="")
+        except Exception:
+            return False
+        return True
+
+    def _func_cleanup(self, llm_resp: str, prompt: str) -> str:
+        cr = llm_resp.strip()
+        if cr[-1] == ".":
+            cr = cr[:-1]
+        # to only use the first line of output
+        cr = cr.split("\n")[0]
+        return cr
+
+    def _func_fail_default_resp(self) -> str:
+        fs = "asleep"
+        return fs
+
+    async def _generate_schedule_for_given_hour(
+        self, role: "STRole", curr_hour_str, p_f_ds_hourly_org, hour_str, intermission2=None
+    ):
+        def create_prompt_input(persona, curr_hour_str, p_f_ds_hourly_org, hour_str, intermission2=None):
+            schedule_format = ""
+            for i in hour_str:
+                schedule_format += f"[{persona.scratch.get_str_curr_date_str()} -- {i}]"
+                schedule_format += " Activity: [Fill in]\n"
+            schedule_format = schedule_format[:-1]
+
+            intermission_str = "Here is the originally intended hourly breakdown of"
+            intermission_str += f" {persona.scratch.get_str_firstname()}'s schedule today: "
+            for count, i in enumerate(persona.scratch.daily_req):
+                intermission_str += f"{str(count + 1)}) {i}, "
+            intermission_str = intermission_str[:-2]
+
+            prior_schedule = ""
+            if p_f_ds_hourly_org:
+                prior_schedule = "\n"
+                for count, i in enumerate(p_f_ds_hourly_org):
+                    prior_schedule += f"[(ID:{get_random_alphanumeric()})"
+                    prior_schedule += f" {persona.scratch.get_str_curr_date_str()} --"
+                    prior_schedule += f" {hour_str[count]}] Activity:"
+                    prior_schedule += f" {persona.scratch.get_str_firstname()}"
+                    prior_schedule += f" is {i}\n"
+
+            prompt_ending = f"[(ID:{get_random_alphanumeric()})"
+            prompt_ending += f" {persona.scratch.get_str_curr_date_str()}"
+            prompt_ending += f" -- {curr_hour_str}] Activity:"
+            prompt_ending += f" {persona.scratch.get_str_firstname()} is"
+
+            if intermission2:
+                intermission2 = f"\n{intermission2}"
+
+            prompt_input = []
+            prompt_input += [schedule_format]
+            prompt_input += [persona.scratch.get_str_iss()]
+
+            prompt_input += [prior_schedule + "\n"]
+            prompt_input += [intermission_str]
+            if intermission2:
+                prompt_input += [intermission2]
+            else:
+                prompt_input += [""]
+            prompt_input += [prompt_ending]
+
+            return prompt_input
+
+        prompt_template = "generate_hourly_schedule_v2.txt"
+        prompt_input = create_prompt_input(role, curr_hour_str, p_f_ds_hourly_org, hour_str, intermission2)
+        prompt_input_str = "\n".join(prompt_input)
+        prompt = self.generate_prompt_with_tmpl_filename(prompt_input, prompt_template)
+        self.fail_default_resp = self._func_fail_default_resp()
+        output = await self._run_gpt35_max_tokens(prompt, max_tokens=50)
+        logger.info(
+            f"Role: {role.name} _generate_schedule_for_given_hour prompt_input: {prompt_input_str}, "
+            f"output: {output}"
+        )
+        return output
+
+    async def run(self, role: "STRole", wake_up_hour: int):
+        hour_str = [
+            "00:00 AM",
+            "01:00 AM",
+            "02:00 AM",
+            "03:00 AM",
+            "04:00 AM",
+            "05:00 AM",
+            "06:00 AM",
+            "07:00 AM",
+            "08:00 AM",
+            "09:00 AM",
+            "10:00 AM",
+            "11:00 AM",
+            "12:00 PM",
+            "01:00 PM",
+            "02:00 PM",
+            "03:00 PM",
+            "04:00 PM",
+            "05:00 PM",
+            "06:00 PM",
+            "07:00 PM",
+            "08:00 PM",
+            "09:00 PM",
+            "10:00 PM",
+            "11:00 PM",
+        ]
+        n_m1_activity = []
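+        # Illustrative example: with wake_up_hour=7, the loop below fills the first
+        # seven slots of hour_str with "sleeping" and then queries the LLM once per
+        # remaining hour, so n_m1_activity might start as
+        # ["sleeping"] * 7 + ["waking up and starting her morning routine", ...].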
+ diversity_repeat_count = 1 # TODO mg 1->3 + for i in range(diversity_repeat_count): + logger.info(f"diversity_repeat_count idx: {i}") + n_m1_activity_set = set(n_m1_activity) + if len(n_m1_activity_set) < 5: + n_m1_activity = [] + for count, curr_hour_str in enumerate(hour_str): + if wake_up_hour > 0: + n_m1_activity += ["sleeping"] + wake_up_hour -= 1 + else: + logger.info(f"_generate_schedule_for_given_hour idx: {count}, n_m1_activity: {n_m1_activity}") + n_m1_activity += [ + await self._generate_schedule_for_given_hour(role, curr_hour_str, n_m1_activity, hour_str) + ] + + # Step 1. Compressing the hourly schedule to the following format: + # The integer indicates the number of hours. They should add up to 24. + # [['sleeping', 6], ['waking up and starting her morning routine', 1], + # ['eating breakfast', 1], ['getting ready for the day', 1], + # ['working on her painting', 2], ['taking a break', 1], + # ['having lunch', 1], ['working on her painting', 3], + # ['taking a break', 2], ['working on her painting', 2], + # ['relaxing and watching TV', 1], ['going to bed', 1], ['sleeping', 2]] + _n_m1_hourly_compressed = [] + prev = None + prev_count = 0 + for i in n_m1_activity: + if i != prev: + prev_count = 1 + _n_m1_hourly_compressed += [[i, prev_count]] + prev = i + elif _n_m1_hourly_compressed: + _n_m1_hourly_compressed[-1][1] += 1 + + # Step 2. Expand to min scale (from hour scale) + # [['sleeping', 360], ['waking up and starting her morning routine', 60], + # ['eating breakfast', 60],.. + n_m1_hourly_compressed = [] + for task, duration in _n_m1_hourly_compressed: + n_m1_hourly_compressed += [[task, duration * 60]] + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {n_m1_hourly_compressed}") + return n_m1_hourly_compressed diff --git a/metagpt/ext/stanford_town/actions/gen_iter_chat_utt.py b/metagpt/ext/stanford_town/actions/gen_iter_chat_utt.py new file mode 100644 index 0000000000..40f6d3af0e --- /dev/null +++ b/metagpt/ext/stanford_town/actions/gen_iter_chat_utt.py @@ -0,0 +1,125 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : generate_iterative_chat_utt + +from metagpt.environment.stanford_town.env_space import EnvObsParams, EnvObsType +from metagpt.ext.stanford_town.actions.st_action import STAction +from metagpt.ext.stanford_town.utils.utils import extract_first_json_dict +from metagpt.logs import logger + + +class GenIterChatUTT(STAction): + name: str = "GenIterChatUTT" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + resp = False + try: + _ = extract_first_json_dict(llm_resp) + resp = True + except Exception: + pass + return resp + + def _func_cleanup(self, llm_resp: str, prompt: str) -> dict: + gpt_response = extract_first_json_dict(llm_resp) + + cleaned_dict = dict() + cleaned = [] + for key, val in gpt_response.items(): + cleaned += [val] + cleaned_dict["utterance"] = cleaned[0] + cleaned_dict["end"] = True + if "f" in str(cleaned[1]) or "F" in str(cleaned[1]): + cleaned_dict["end"] = False + + return cleaned_dict + + def _func_fail_default_resp(self) -> dict: + cleaned_dict = dict() + cleaned_dict["utterance"] = "..." 
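+        # Illustrative example: a reply such as '{"utterance": "Hi there!", "end": "f"}'
+        # is cleaned to {"utterance": "Hi there!", "end": False}; an "f"/"F" in the
+        # second value keeps the conversation open. This fallback keeps it open too,
+        # so the next turn can retry after an unparseable reply.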
+        cleaned_dict["end"] = False
+        return cleaned_dict
+
+    async def run(
+        self,
+        init_role: "STRole",
+        target_role: "STRole",
+        retrieved: dict,
+        curr_context: str,
+        curr_chat: list[str],
+        *args,
+        **kwargs,
+    ) -> dict:
+        def create_prompt_input(
+            access_tile: dict[str, str],
+            init_role: "STRole",
+            target_role: "STRole",
+            retrieved: dict,
+            curr_context: str,
+            curr_chat: list[str],
+        ):
+            role = init_role
+            scratch = role.rc.scratch
+            target_scratch = target_role.rc.scratch
+            prev_convo_insert = "\n"
+            if role.rc.memory.chat_list:
+                for i in role.rc.memory.chat_list:
+                    if i.object == target_role.name:
+                        v1 = int((scratch.curr_time - i.created).total_seconds() / 60)
+                        prev_convo_insert += (
+                            f"{str(v1)} minutes ago, {scratch.name} and "
+                            f"{target_scratch.name} were already {i.description} "
+                            f"This context takes place after that conversation."
+                        )
+                        break
+            if prev_convo_insert == "\n":
+                prev_convo_insert = ""
+            if role.rc.memory.chat_list:
+                if int((scratch.curr_time - role.rc.memory.chat_list[-1].created).total_seconds() / 60) > 480:
+                    prev_convo_insert = ""
+            logger.info(f"prev_convo_insert: {prev_convo_insert}")
+
+            curr_sector = f"{access_tile['sector']}"
+            curr_arena = f"{access_tile['arena']}"
+            curr_location = f"{curr_arena} in {curr_sector}"
+
+            retrieved_str = ""
+            for key, vals in retrieved.items():
+                for v in vals:
+                    retrieved_str += f"- {v.description}\n"
+
+            convo_str = ""
+            for i in curr_chat:
+                convo_str += ": ".join(i) + "\n"
+            if convo_str == "":
+                convo_str = "[The conversation has not started yet -- start it!]"
+
+            init_iss = f"Here is a brief description of {scratch.name}.\n{scratch.get_str_iss()}"
+            prompt_input = [
+                init_iss,
+                scratch.name,
+                retrieved_str,
+                prev_convo_insert,
+                curr_location,
+                curr_context,
+                scratch.name,
+                target_scratch.name,
+                convo_str,
+                scratch.name,
+                target_scratch.name,
+                scratch.name,
+                scratch.name,
+                scratch.name,
+            ]
+            return prompt_input
+
+        access_tile = init_role.rc.env.observe(
+            obs_params=EnvObsParams(obs_type=EnvObsType.GET_TITLE, coord=init_role.scratch.curr_tile)
+        )
+        prompt_input = create_prompt_input(access_tile, init_role, target_role, retrieved, curr_context, curr_chat)
+        prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "iterative_convo_v1.txt")
+        # original using `ChatGPT_safe_generate_response_OLD`
+        self.fail_default_resp = self._func_fail_default_resp()
+        output = await self._run_gpt35_wo_extra_prompt(prompt)
+        logger.info(f"Role: {init_role.name} Action: {self.cls_name} output: {output}")
+        return output
diff --git a/metagpt/ext/stanford_town/actions/inner_voice_action.py b/metagpt/ext/stanford_town/actions/inner_voice_action.py
new file mode 100644
index 0000000000..83cfa037ba
--- /dev/null
+++ b/metagpt/ext/stanford_town/actions/inner_voice_action.py
@@ -0,0 +1,35 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+# @Desc :
+
+from metagpt.ext.stanford_town.actions.st_action import STAction
+from metagpt.logs import logger
+
+
+class AgentWhisperThoughtAction(STAction):
+    name: str = "AgentWhisperThoughtAction"
+
+    def _func_validate(self, llm_resp: str, prompt: str) -> bool:
+        try:
+            self._func_cleanup(llm_resp, prompt)
+            return True
+        except Exception:
+            return False
+
+    def _func_cleanup(self, llm_resp: str, prompt: str = "") -> str:
+        return llm_resp.split('"')[0].strip()
+
+    def _func_fail_default_resp(self) -> str:
+        pass
+
+    async def run(self, role: "STRole", statements: str, test_input=None, verbose=False) -> str:
+        def create_prompt_input(role: "STRole",
statements, test_input=None):
+            prompt_input = [role.scratch.name, statements]
+            return prompt_input
+
+        prompt_input = create_prompt_input(role, statements)
+        prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "whisper_inner_thought_v1.txt")
+
+        output = await self._run_gpt35_max_tokens(prompt, max_tokens=50)
+        logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}")
+        return output
diff --git a/metagpt/ext/stanford_town/actions/new_decomp_schedule.py b/metagpt/ext/stanford_town/actions/new_decomp_schedule.py
new file mode 100644
index 0000000000..759ec170f4
--- /dev/null
+++ b/metagpt/ext/stanford_town/actions/new_decomp_schedule.py
@@ -0,0 +1,154 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+# @Desc : new_decomp_schedule
+
+import datetime
+
+from metagpt.ext.stanford_town.actions.st_action import STAction
+from metagpt.logs import logger
+
+
+class NewDecompSchedule(STAction):
+    name: str = "NewDecompSchedule"
+
+    def _func_validate(self, llm_resp: str, prompt: str) -> bool:
+        resp = False
+        try:
+            llm_resp = self._func_cleanup(llm_resp, prompt)
+            dur_sum = 0
+            for act, dur in llm_resp:
+                dur_sum += dur
+                if not isinstance(act, str):
+                    return False
+                if not isinstance(dur, int):
+                    return False
+            x = prompt.split("\n")[0].split("originally planned schedule from")[-1].strip()[:-1]
+            x = [datetime.datetime.strptime(i.strip(), "%H:%M %p") for i in x.split(" to ")]
+            delta_min = int((x[1] - x[0]).total_seconds() / 60)
+
+            if int(dur_sum) != int(delta_min):
+                return False
+            resp = True
+        except Exception:
+            pass
+        return resp
+
+    def _func_cleanup(self, llm_resp: str, prompt: str) -> list:
+        new_schedule = prompt + " " + llm_resp.strip()
+        new_schedule = new_schedule.split("The revised schedule:")[-1].strip()
+        new_schedule = new_schedule.split("\n")
+
+        ret_temp = []
+        for i in new_schedule:
+            ret_temp += [i.split(" -- ")]
+
+        ret = []
+        for time_str, action in ret_temp:
+            start_time = time_str.split(" ~ ")[0].strip()
+            end_time = time_str.split(" ~ ")[1].strip()
+            delta = datetime.datetime.strptime(end_time, "%H:%M") - datetime.datetime.strptime(start_time, "%H:%M")
+            delta_min = int(delta.total_seconds() / 60)
+            if delta_min < 0:
+                delta_min = 0
+            ret += [[action, delta_min]]
+
+        return ret
+
+    def _func_fail_default_resp(self, main_act_dur: list, truncated_act_dur: list) -> list:
+        dur_sum = 0
+        for act, dur in main_act_dur:
+            dur_sum += dur
+
+        ret = truncated_act_dur[:]
+        ret += main_act_dur[len(ret) - 1 :]
+
+        # If there is excess duration, we need to trim...
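+        # Illustrative example: with main_act_dur = [["nap", 60], ["read", 60]]
+        # (120 minutes) and truncated_act_dur = [["nap", 30], ["phone call", 45]],
+        # ret starts as [["nap", 30], ["phone call", 45], ["read", 60]] (135 minutes),
+        # so the loop below finds a 15-minute excess and shortens "read" to 45.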
+ ret_dur_sum = 0 + count = 0 + over = None + for act, dur in ret: + ret_dur_sum += dur + if ret_dur_sum == dur_sum: + break + if ret_dur_sum > dur_sum: + over = ret_dur_sum - dur_sum + break + count += 1 + + if over: + ret = ret[: count + 1] + ret[-1][1] -= over + + return ret + + async def run( + self, + role: "STRole", + main_act_dur: int, + truncated_act_dur: int, + start_time_hour: datetime, + end_time_hour: datetime, + inserted_act: str, + inserted_act_dur: int, + *args, + **kwargs, + ): + def create_prompt_input( + role: "STRole", + main_act_dur: int, + truncated_act_dur: int, + start_time_hour: datetime, + end_time_hour: datetime, + inserted_act: str, + inserted_act_dur: int, + ): + persona_name = role.name + start_hour_str = start_time_hour.strftime("%H:%M %p") + end_hour_str = end_time_hour.strftime("%H:%M %p") + + original_plan = "" + for_time = start_time_hour + for i in main_act_dur: + original_plan += ( + f'{for_time.strftime("%H:%M")} ~ ' + f'{(for_time + datetime.timedelta(minutes=int(i[1]))).strftime("%H:%M")} -- ' + i[0] + ) + original_plan += "\n" + for_time += datetime.timedelta(minutes=int(i[1])) + + new_plan_init = "" + for_time = start_time_hour + for count, i in enumerate(truncated_act_dur): + new_plan_init += ( + f'{for_time.strftime("%H:%M")} ~ ' + f'{(for_time + datetime.timedelta(minutes=int(i[1]))).strftime("%H:%M")} -- ' + i[0] + ) + new_plan_init += "\n" + if count < len(truncated_act_dur) - 1: + for_time += datetime.timedelta(minutes=int(i[1])) + + new_plan_init += (for_time + datetime.timedelta(minutes=int(i[1]))).strftime("%H:%M") + " ~" + + prompt_input = [ + persona_name, + start_hour_str, + end_hour_str, + original_plan, + persona_name, + inserted_act, + inserted_act_dur, + persona_name, + start_hour_str, + end_hour_str, + end_hour_str, + new_plan_init, + ] + return prompt_input + + prompt_input = create_prompt_input( + role, main_act_dur, truncated_act_dur, start_time_hour, end_time_hour, inserted_act, inserted_act_dur + ) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "new_decomp_schedule_v1.txt") + self.fail_default_resp = self._func_fail_default_resp(main_act_dur, truncated_act_dur) + output = await self._run_gpt35_max_tokens(prompt, max_tokens=1000) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output diff --git a/metagpt/ext/stanford_town/actions/run_reflect_action.py b/metagpt/ext/stanford_town/actions/run_reflect_action.py new file mode 100644 index 0000000000..895f6828f0 --- /dev/null +++ b/metagpt/ext/stanford_town/actions/run_reflect_action.py @@ -0,0 +1,277 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : Integration Reflect Action + +import re + +from metagpt.ext.stanford_town.actions.st_action import STAction +from metagpt.logs import logger + + +# Run GPT Prompt Focal Point method +class AgentFocusPt(STAction): + name: str = "AgentFocusPt" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + try: + self._func_cleanup(llm_resp, prompt) + return True + except Exception: + return False + + def _func_cleanup(self, llm_resp: str, prompt: str = "") -> str: + try: + """ + Cleanup handling has been completed for run_v2 + """ + return llm_resp + except Exception as exp: + logger.error(f"{self.cls_name} with error {exp}") + + def _func_fail_default_resp(self) -> str: + pass + + async def run(self, role: "STRole", statements: str, n: int, test_input=None) -> str: + def create_prompt_input(role: "STRole", statements, n, test_input=None): + prompt_input = 
[statements, str(n)] + return prompt_input + + prompt_input = create_prompt_input(role, statements, n) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "generate_focal_pt_v1.txt") + + example_output = '["What should Jane do for lunch", "Does Jane like strawberry", "Who is Jane"]' + special_instruction = "Output must be a list of str." + output = await self._run_gpt35(prompt, example_output, special_instruction) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +# Run GPT Prompt Insight and Guidance +class AgentInsightAndGuidance(STAction): + name: str = "AgentInsightAndGuidance" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + try: + self._func_cleanup(llm_resp, prompt) + return True + except Exception: + return False + + def _func_cleanup(self, llm_resp: str, prompt: str = "") -> dict: + try: + llm_resp = "1. " + llm_resp.strip() + ret = dict() + for i in llm_resp.split("\n"): + row = " ".join(i.split(". ")[1:]) + if "(because of " not in row: + continue + thought = row.split("(because of ")[0].strip() + if ")" not in row.split("(because of ")[1]: + continue + evi_raw = row.split("(because of ")[1].split(")")[0].strip() + evi_raw = re.findall(r"\d+", evi_raw) + evi_raw = [int(i.strip()) for i in evi_raw] + ret[thought] = evi_raw + return ret + except Exception as exp: + logger.error(f"{self.cls_name} with error {exp}") + + def _func_fail_default_resp(self, n: int) -> str: + return ["I am hungry"] * n + + async def run(self, role: "STRole", statements: str, n: int, test_input=None) -> dict: + def create_prompt_input(role, statements, n, test_input=None): + prompt_input = [statements, str(n)] + return prompt_input + + prompt_input = create_prompt_input(role, statements, n) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "insight_and_evidence_v1.txt") + + self.fail_default_resp = self._func_fail_default_resp(n) + output = await self._run_gpt35_max_tokens(prompt, max_tokens=150) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +# Run GPT Prompt Event Triple +class AgentEventTriple(STAction): + name: str = "AgentEventTriple" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + try: + llm_resp = self._func_cleanup(llm_resp, prompt="") + if len(llm_resp) != 2: + return False + except Exception: + return False + return True + + def _func_cleanup(self, llm_resp: str, prompt: str = "") -> list: + try: + cr = llm_resp.strip() + cr = [i.strip() for i in cr.split(")")[0].split(",")] + if len(cr) != 2: + return cr[-2:] + return cr + except Exception as exp: + logger.error(f"{self.cls_name} with error {exp}") + + def _func_fail_default_resp(self) -> str: + pass + + async def run(self, statements: str, role: "STRole", verbose=False) -> tuple: + def create_prompt_input(statements, role): + if "(" in statements: + statements = statements.split("(")[-1].split(")")[0] + prompt_input = [role.scratch.name, statements, role.scratch.name] + return prompt_input + + prompt_input = create_prompt_input(statements, role) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "generate_event_triple_v1.txt") + + output = await self._run_gpt35_max_tokens(prompt, max_tokens=30) + output = (role.scratch.name, output[0], output[1]) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +# Run GPT Prompt Event Poignancy +class AgentEventPoignancy(STAction): + name: str = "AgentEventPoignancy" + + def 
_func_validate(self, llm_resp: str, prompt: str) -> bool: + try: + self._func_cleanup(llm_resp, prompt) + return True + except Exception: + return False + + def _func_cleanup(self, llm_resp: str, prompt: str = "") -> int: + try: + llm_resp = int(llm_resp.strip()) + return llm_resp + except Exception as exp: + logger.error(f"{self.cls_name} with error {exp}") + + def _func_fail_default_resp(self) -> str: + pass + + async def run(self, role: "STRole", statements: str, test_input=None, verbose=False) -> str: + def create_prompt_input(role: "STRole", statements: str, test_input=None): + prompt_input = [role.scratch.name, role.scratch.get_str_iss(), role.scratch.name, statements] + return prompt_input + + prompt_input = create_prompt_input(role, statements) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "poignancy_event_v1.txt") + + example_output = "5" # ######## + special_instruction = "The output should ONLY contain ONE integer value on the scale of 1 to 10." + output = await self._run_gpt35(prompt, example_output, special_instruction) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +# Run GPT Prompt Chat Poignancy +class AgentChatPoignancy(STAction): + name: str = "AgentChatPoignancy" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + try: + self._func_cleanup(llm_resp, prompt) + return True + except Exception: + return False + + def _func_cleanup(self, llm_resp: str, prompt: str = "") -> int: + try: + llm_resp = int(llm_resp.strip()) + return llm_resp + except Exception as exp: + logger.error(f"{self.cls_name} with error {exp}") + + def _func_fail_default_resp(self) -> str: + pass + + async def run(self, role: "STRole", statements: str, test_input=None, verbose=False) -> str: + def create_prompt_input(role: "STRole", statements, test_input=None): + prompt_input = [role.scratch.name, role.scratch.get_str_iss(), role.scratch.name, statements] + return prompt_input + + prompt_input = create_prompt_input(role, statements) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "poignancy_chat_v1.txt") + + example_output = "5" # ######## + special_instruction = "The output should ONLY contain ONE integer value on the scale of 1 to 10." 
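+        # Illustrative example: _run_gpt35 wraps the prompt so the model answers in
+        # the form {"output": "5"}; _func_cleanup then coerces the value via
+        # int("5".strip()), any non-integer reply fails validation, and once the
+        # retries are exhausted _run_gpt35 returns False.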
+ output = await self._run_gpt35(prompt, example_output, special_instruction) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +# Run GPT Prompt Planning Thought on Convo +class AgentPlanThoughtOnConvo(STAction): + name: str = "AgentPlanThoughtOnConvo" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + try: + self._func_cleanup(llm_resp, prompt) + return True + except Exception: + return False + + def _func_cleanup(self, llm_resp: str, prompt: str = "") -> str: + try: + return llm_resp.split('"')[0].strip() + except Exception as exp: + logger.error(f"{self.cls_name} with error {exp}") + + def _func_fail_default_resp(self) -> str: + pass + + async def run(self, role: "STRole", statements: str, test_input=None, verbose=False) -> str: + def create_prompt_input(role, statements, test_input=None): + prompt_input = [statements, role.scratch.name, role.scratch.name, role.scratch.name] + return prompt_input + + prompt_input = create_prompt_input(role, statements) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "planning_thought_on_convo_v1.txt") + + output = await self._run_gpt35_max_tokens(prompt, max_tokens=50) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +# Run GPT Prompt Memory on Convo +class AgentMemoryOnConvo(STAction): + name: str = "AgentMemoryOnConvo" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + try: + self._func_cleanup(llm_resp, prompt) + return True + except Exception: + return False + + def _func_cleanup(self, llm_resp: str, prompt: str = "") -> str: + try: + return llm_resp.split('"')[0].strip() + except Exception as exp: + logger.error(f"{self.cls_name} with error {exp}") + + def _func_fail_default_resp(self) -> str: + pass + + async def run(self, role: "STRole", statements: str, test_input=None, verbose=False) -> str: + def create_prompt_input(role, statements, test_input=None): + prompt_input = [statements, role.scratch.name, role.scratch.name, role.scratch.name] + return prompt_input + + prompt_input = create_prompt_input(role, statements) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "memo_on_convo_v1.txt") + example_output = "Jane Doe was interesting to talk to." 
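+        # Illustrative example: a raw reply like
+        # 'Jane Doe was interesting to talk to." She seemed curious' is cleaned by
+        # _func_cleanup to everything before the first double quote:
+        # 'Jane Doe was interesting to talk to.'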
+        special_instruction = (
+            "The output should ONLY contain a string that summarizes anything interesting "
+            "that the agent may have noticed"
+        )
+        output = await self._run_gpt35(prompt, example_output, special_instruction)
+        logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}")
+        return output
diff --git a/metagpt/ext/stanford_town/actions/st_action.py b/metagpt/ext/stanford_town/actions/st_action.py
new file mode 100644
index 0000000000..321676374d
--- /dev/null
+++ b/metagpt/ext/stanford_town/actions/st_action.py
@@ -0,0 +1,119 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+# @Desc : StanfordTown Action
+import json
+import time
+from abc import abstractmethod
+from pathlib import Path
+from typing import Any, Optional, Union
+
+from metagpt.actions.action import Action
+from metagpt.config2 import config
+from metagpt.ext.stanford_town.utils.const import PROMPTS_DIR
+from metagpt.logs import logger
+
+
+class STAction(Action):
+    name: str = "STAction"
+    prompt_dir: Path = PROMPTS_DIR
+    fail_default_resp: Optional[str] = None
+
+    @property
+    def cls_name(self):
+        return self.__class__.__name__
+
+    @abstractmethod
+    def _func_validate(self, llm_resp: str, prompt: str):
+        raise NotImplementedError
+
+    @abstractmethod
+    def _func_cleanup(self, llm_resp: str, prompt: str):
+        raise NotImplementedError
+
+    @abstractmethod
+    def _func_fail_default_resp(self):
+        raise NotImplementedError
+
+    def generate_prompt_with_tmpl_filename(self, prompt_input: Union[str, list], tmpl_filename) -> str:
+        """
+        same with `generate_prompt`
+        Args:
+            prompt_input: the input we want to feed in (IF THERE ARE MORE THAN ONE INPUT, THIS CAN BE A LIST.)
+            tmpl_filename: prompt template filename
+        Returns:
+            a str prompt that will be sent to the LLM server.
+        """
+        if isinstance(prompt_input, str):
+            prompt_input = [prompt_input]
+        prompt_input = [str(i) for i in prompt_input]
+
+        with open(str(self.prompt_dir.joinpath(tmpl_filename)), "r") as f:
+            prompt = f.read()
+        for count, i in enumerate(prompt_input):
+            prompt = prompt.replace(f"!<INPUT {count}>!", i)
+        if "###" in prompt:
+            prompt = prompt.split("###")[1]
+        return prompt.strip()
+
+    async def _aask(self, prompt: str) -> str:
+        return await self.llm.aask(prompt)
+
+    async def _run_gpt35_max_tokens(self, prompt: str, max_tokens: int = 50, retry: int = 3):
+        for idx in range(retry):
+            try:
+                tmp_max_tokens_rsp = getattr(config.llm, "max_token", 1500)
+                setattr(config.llm, "max_token", max_tokens)
+                self.llm.use_system_prompt = False  # to make it behave like a non-chat completion
+
+                llm_resp = await self._aask(prompt)
+
+                setattr(config.llm, "max_token", tmp_max_tokens_rsp)
+                logger.info(f"Action: {self.cls_name} llm _run_gpt35_max_tokens raw resp: {llm_resp}")
+                if self._func_validate(llm_resp, prompt):
+                    return self._func_cleanup(llm_resp, prompt)
+            except Exception as exp:
+                logger.warning(f"Action: {self.cls_name} _run_gpt35_max_tokens exp: {exp}")
+                time.sleep(5)
+        return self.fail_default_resp
+
+    async def _run_gpt35(
+        self, prompt: str, example_output: str, special_instruction: str, retry: int = 3
+    ) -> Union[bool, Any]:
+        """same with `gpt_structure.ChatGPT_safe_generate_response`"""
+        prompt = '"""\n' + prompt + '\n"""\n'
+        prompt += f"Output the response to the prompt above in json. 
{special_instruction}\n" + prompt += "Example output json:\n" + prompt += '{"output": "' + str(example_output) + '"}' + + for idx in range(retry): + try: + llm_resp = await self._aask(prompt) + logger.info(f"Action: {self.cls_name} llm _run_gpt35 raw resp: {llm_resp}") + end_idx = llm_resp.strip().rfind("}") + 1 + llm_resp = llm_resp[:end_idx] + llm_resp = json.loads(llm_resp)["output"] + + if self._func_validate(llm_resp, prompt): + return self._func_cleanup(llm_resp, prompt) + except Exception as exp: + logger.warning(f"Action: {self.cls_name} _run_gpt35 exp: {exp}") + time.sleep(5) # usually avoid `Rate limit` + return False + + async def _run_gpt35_wo_extra_prompt(self, prompt: str, retry: int = 3) -> str: + for idx in range(retry): + try: + llm_resp = await self._aask(prompt) + llm_resp = llm_resp.strip() + logger.info(f"Action: {self.cls_name} llm _run_gpt35_wo_extra_prompt raw resp: {llm_resp}") + if self._func_validate(llm_resp, prompt): + return self._func_cleanup(llm_resp, prompt) + except Exception as exp: + logger.warning(f"Action: {self.cls_name} _run_gpt35_wo_extra_prompt exp: {exp}") + time.sleep(5) # usually avoid `Rate limit` + return self.fail_default_resp + + async def run(self, *args, **kwargs): + """Run action""" + raise NotImplementedError("The run method should be implemented in a subclass.") diff --git a/metagpt/ext/stanford_town/actions/summarize_conv.py b/metagpt/ext/stanford_town/actions/summarize_conv.py new file mode 100644 index 0000000000..5be5fcaa43 --- /dev/null +++ b/metagpt/ext/stanford_town/actions/summarize_conv.py @@ -0,0 +1,47 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : summarize the content of agents' conversation + +from metagpt.ext.stanford_town.actions.st_action import STAction +from metagpt.logs import logger + + +class SummarizeConv(STAction): + name: str = "SummarizeConv" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + resp = False + try: + _ = self._func_cleanup(llm_resp, prompt) + resp = True + except Exception: + pass + return resp + + def _func_cleanup(self, llm_resp: str, prompt: str) -> str: + ret = "conversing about " + llm_resp.strip() + return ret + + def _func_fail_default_resp(self) -> str: + return "conversing with a housemate about morning greetings" + + async def run(self, conv: list): + def create_prompt_input(conversation: list): + convo_str = "" + for row in conversation: + convo_str += f'{row[0]}: "{row[1]}"\n' + prompt_input = [convo_str] + return prompt_input + + prompt_input = create_prompt_input(conv) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "summarize_conversation_v1.txt") + + example_output = "conversing about what to eat for lunch" + special_instruction = ( + "The output must continue the sentence above by filling in the tag. " + "Don't start with 'this is a conversation about...' Just finish the sentence " + "but do not miss any important details (including who are chatting)." 
+ ) + output = await self._run_gpt35(prompt, example_output, special_instruction) + logger.info(f"Action: {self.cls_name} output: {output}") + return output diff --git a/metagpt/ext/stanford_town/actions/task_decomp.py b/metagpt/ext/stanford_town/actions/task_decomp.py new file mode 100644 index 0000000000..3a23a73456 --- /dev/null +++ b/metagpt/ext/stanford_town/actions/task_decomp.py @@ -0,0 +1,173 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : task_decomp + +import datetime + +from metagpt.ext.stanford_town.actions.st_action import STAction +from metagpt.logs import logger + + +class TaskDecomp(STAction): + name: str = "TaskDecomp" + + def _func_cleanup(self, llm_resp: str, prompt: str) -> list: + # TODO SOMETHING HERE sometimes fails... See screenshot + temp = [i.strip() for i in llm_resp.split("\n")] + _cr = [] + cr = [] + for count, i in enumerate(temp): + if count != 0: + _cr += [" ".join([j.strip() for j in i.split(" ")][3:])] + else: + _cr += [i] + for count, i in enumerate(_cr): + k = [j.strip() for j in i.split("(duration in minutes:")] + task = k[0] + if task[-1] == ".": + task = task[:-1] + duration = int(k[1].split(",")[0].strip()) + cr += [[task, duration]] + + total_expected_min = int(prompt.split("(total duration in minutes")[-1].split("):")[0].strip()) + + # TODO -- now, you need to make sure that this is the same as the sum of + # the current action sequence. + curr_min_slot = [ + ["dummy", -1], + ] # (task_name, task_index) + for count, i in enumerate(cr): + i_task = i[0] + i_duration = i[1] + + i_duration -= i_duration % 5 + if i_duration > 0: + for j in range(i_duration): + curr_min_slot += [(i_task, count)] + curr_min_slot = curr_min_slot[1:] + + if len(curr_min_slot) > total_expected_min: + last_task = curr_min_slot[60] + for i in range(1, 6): + curr_min_slot[-1 * i] = last_task + elif len(curr_min_slot) < total_expected_min: + last_task = curr_min_slot[-1] + for i in range(total_expected_min - len(curr_min_slot)): + curr_min_slot += [last_task] + + cr_ret = [ + ["dummy", -1], + ] + for task, task_index in curr_min_slot: + if task != cr_ret[-1][0]: + cr_ret += [[task, 1]] + else: + cr_ret[-1][1] += 1 + cr = cr_ret[1:] + + return cr + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + # TODO -- this sometimes generates error + try: + self._func_cleanup(llm_resp, prompt) + except Exception: + return False + return True + + def _func_fail_default_resp(self) -> int: + fs = [["asleep", 0]] + return fs + + async def run(self, role: "STRole", task_desc: int, truncated_act_dur: int, *args, **kwargs): + def create_prompt_input(role, task, duration): + """ + Today is Saturday June 25. From 00:00 ~ 06:00am, Maeve is + planning on sleeping, 06:00 ~ 07:00am, Maeve is + planning on waking up and doing her morning routine, + and from 07:00am ~08:00am, Maeve is planning on having breakfast. + """ + + curr_f_org_index = role.scratch.get_f_daily_schedule_hourly_org_index() + all_indices = [] + # if curr_f_org_index > 0: + # all_indices += [curr_f_org_index-1] + all_indices += [curr_f_org_index] + if curr_f_org_index + 1 <= len(role.scratch.f_daily_schedule_hourly_org): + all_indices += [curr_f_org_index + 1] + if curr_f_org_index + 2 <= len(role.scratch.f_daily_schedule_hourly_org): + all_indices += [curr_f_org_index + 2] + + curr_time_range = "" + + logger.debug("DEBUG") + logger.debug(role.scratch.f_daily_schedule_hourly_org) + logger.debug(all_indices) + + summ_str = f'Today is {role.scratch.curr_time.strftime("%B %d, %Y")}. 
' + summ_str += "From " + for index in all_indices: + logger.debug(f"index {index}") + if index < len(role.scratch.f_daily_schedule_hourly_org): + start_min = 0 + for i in range(index): + start_min += role.scratch.f_daily_schedule_hourly_org[i][1] + end_min = start_min + role.scratch.f_daily_schedule_hourly_org[index][1] + start_time = datetime.datetime.strptime("00:00:00", "%H:%M:%S") + datetime.timedelta( + minutes=start_min + ) + end_time = datetime.datetime.strptime("00:00:00", "%H:%M:%S") + datetime.timedelta( + minutes=end_min + ) + start_time_str = start_time.strftime("%H:%M%p") + end_time_str = end_time.strftime("%H:%M%p") + summ_str += ( + f"{start_time_str} ~ {end_time_str}, {role.name} is planning " + f"on {role.scratch.f_daily_schedule_hourly_org[index][0]}, " + ) + if curr_f_org_index + 1 == index: + curr_time_range = f"{start_time_str} ~ {end_time_str}" + summ_str = summ_str[:-2] + "." + + prompt_input = [] + prompt_input += [role.scratch.get_str_iss()] + prompt_input += [summ_str] + # prompt_input += [role.scratch.get_str_curr_date_str()] + prompt_input += [role.scratch.get_str_firstname()] + prompt_input += [role.scratch.get_str_firstname()] + prompt_input += [task] + prompt_input += [curr_time_range] + prompt_input += [duration] + prompt_input += [role.scratch.get_str_firstname()] + return prompt_input + + prompt_input = create_prompt_input(role, task_desc, truncated_act_dur) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "task_decomp_v3.txt") + self.fail_default_resp = self._func_fail_default_resp() + output = await self._run_gpt35_max_tokens(prompt, max_tokens=1000) + logger.info(f"Role: {role.name} {self.cls_name} output: {output}") + + fin_output = [] + time_sum = 0 + for i_task, i_duration in output: + time_sum += i_duration + # HM????????? 
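+            # Illustrative example: with truncated_act_dur = 60 and output =
+            # [["shower", 15], ["dress", 15], ["breakfast", 40]], the check below
+            # keeps "shower" and "dress" (running total 30 <= 60), stops at
+            # "breakfast" (70 > 60), and the padding afterwards stretches the last
+            # kept subtask so the durations sum to exactly 60.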
+            # if time_sum < duration:
+            if time_sum <= truncated_act_dur:
+                fin_output += [[i_task, i_duration]]
+            else:
+                break
+        ftime_sum = 0
+        for fi_task, fi_duration in fin_output:
+            ftime_sum += fi_duration
+
+        fin_output[-1][1] += truncated_act_dur - ftime_sum
+        output = fin_output
+
+        task_decomp = output
+        ret = []
+        for decomp_task, duration in task_decomp:
+            ret += [[f"{task_desc} ({decomp_task})", duration]]
+        output = ret
+        logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}")
+        return output
diff --git a/metagpt/ext/stanford_town/actions/wake_up.py b/metagpt/ext/stanford_town/actions/wake_up.py
new file mode 100644
index 0000000000..ea44cd3a42
--- /dev/null
+++ b/metagpt/ext/stanford_town/actions/wake_up.py
@@ -0,0 +1,42 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+# @Desc : wake_up
+
+
+from metagpt.ext.stanford_town.actions.st_action import STAction
+from metagpt.logs import logger
+
+
+class WakeUp(STAction):
+    name: str = "WakeUp"
+
+    def _func_validate(self, llm_resp: str, prompt: str = None) -> bool:
+        try:
+            self._func_cleanup(llm_resp, prompt="")
+        except Exception:
+            return False
+        return True
+
+    def _func_cleanup(self, llm_resp: str, prompt: str) -> int:
+        cr = int(llm_resp.strip().lower().split("am")[0])
+        return cr
+
+    def _func_fail_default_resp(self) -> int:
+        fs = 8
+        return fs
+
+    async def run(self, role: "STRole"):
+        def create_prompt_input(role):
+            prompt_input = [
+                role.scratch.get_str_iss(),
+                role.scratch.get_str_lifestyle(),
+                role.scratch.get_str_firstname(),
+            ]
+            return prompt_input
+
+        prompt_input = create_prompt_input(role)
+        prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "wake_up_hour_v1.txt")
+        self.fail_default_resp = self._func_fail_default_resp()
+        output = await self._run_gpt35_max_tokens(prompt, max_tokens=5)
+        logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}")
+        return output
diff --git a/metagpt/ext/stanford_town/memory/__init__.py b/metagpt/ext/stanford_town/memory/__init__.py
new file mode 100644
index 0000000000..e69de29bb2
diff --git a/metagpt/ext/stanford_town/memory/agent_memory.py b/metagpt/ext/stanford_town/memory/agent_memory.py
new file mode 100644
index 0000000000..d212232f42
--- /dev/null
+++ b/metagpt/ext/stanford_town/memory/agent_memory.py
@@ -0,0 +1,378 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+# @Desc : BasicMemory and AgentMemory implementations
+
+from datetime import datetime
+from pathlib import Path
+from typing import Optional
+
+from pydantic import Field, field_serializer, model_validator
+
+from metagpt.logs import logger
+from metagpt.memory.memory import Memory
+from metagpt.schema import Message
+from metagpt.utils.common import read_json_file, write_json_file
+
+
+class BasicMemory(Message):
+    """
+    BasicMemory inherits from MetaGPT's Message class; its content attribute stands in for the description attribute.
+    Message supports the Chat type well, but offers little for an individual agent's Perceive, Reflect and Plan.
+    For the type design we keep GA's three kinds, with dedicated handling for Chat-type conversations still to be designed.
+    """
+
+    memory_id: Optional[str] = Field(default=None)  # memory id
+    memory_count: int = -1  # running index of this memory; equals the current size of Memory
+    type_count: int = -1  # running index within this memory type (integer)
+    memory_type: Optional[str] = Field(default=None)  # memory type: one of event, thought, chat
+    depth: int = -1  # memory depth (integer)
+    created: Optional[datetime] = Field(default=None)  # creation time
+    expiration: Optional[datetime] = Field(default=None)  # expiration time; None by default
+    last_accessed: Optional[datetime] = Field(default=None)  # last access time; initialized to self.created
+    subject: Optional[str] = Field(default=None)  # subject
+    predicate: Optional[str] = Field(default=None)  # predicate
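+    # Illustrative example: a node for "Klaus is reading" would carry
+    # subject="Klaus", predicate="is", object="reading", with description and
+    # embedding_key mirroring the content and poignancy scoring its importance.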
object: Optional[str] = Field(default=None)  # grammatical object
+
+    description: Optional[str] = Field(default=None)
+    embedding_key: Optional[str] = Field(default=None)  # same as self.content
+    poignancy: int = -1  # importance score
+    keywords: list[str] = Field(default=[])  # keywords
+    filling: list = Field(default=[])  # list of the memory_ids associated with this node
+
+    __hash__ = object.__hash__  # support hash in AgentMemory
+
+    @model_validator(mode="before")
+    @classmethod
+    def check_values(cls, values):
+        if "created" in values:
+            values["last_accessed"] = values["created"]
+        if "content" in values:
+            values["description"] = values["content"]
+        if "filling" in values:
+            values["filling"] = values["filling"] or []
+        return values
+
+    @field_serializer("created", "expiration")
+    def transform_time_field(self, time_field: Optional[datetime]) -> str:
+        if time_field:
+            time_field = time_field.strftime("%Y-%m-%d %H:%M:%S")
+        return time_field
+
+    def summary(self):
+        return self.subject, self.predicate, self.object
+
+    def save_to_dict(self) -> dict:
+        """
+        Convert a BasicMemory instance into a dict for saving to a json file.
+        Note that cause_by is not compatible with GA, so a format conversion is needed here.
+        """
+        memory_dict = dict()
+        node_id = self.memory_id
+        basic_mem_obj = self.model_dump(
+            include=[
+                "node_count",
+                "type_count",
+                "type",
+                "depth",
+                "created",
+                "expiration",
+                "subject",
+                "predicate",
+                "object",
+                "description",
+                "embedding_key",
+                "poignancy",
+                "keywords",
+                "filling",
+                "cause_by",
+            ]
+        )
+
+        memory_dict[node_id] = basic_mem_obj
+        return memory_dict
+
+
+class AgentMemory(Memory):
+    """
+    GA stores three kinds of JSON:
+    1. embedding.json (dict of embedding_key -> embedding)
+    2. nodes.json (dict of node_id -> node)
+    3. kw_strength.json
+    """
+
+    storage: list[BasicMemory] = []  # overrides storage to hold all BasicMemory nodes
+    event_list: list[BasicMemory] = []  # event memories
+    thought_list: list[BasicMemory] = []  # thought memories
+    chat_list: list[BasicMemory] = []  # chat-related memory
+
+    event_keywords: dict[str, list[BasicMemory]] = dict()  # keyword indexes
+    thought_keywords: dict[str, list[BasicMemory]] = dict()
+    chat_keywords: dict[str, list[BasicMemory]] = dict()
+
+    kw_strength_event: dict[str, int] = dict()
+    kw_strength_thought: dict[str, int] = dict()
+
+    memory_saved: Optional[Path] = Field(default=None)
+    embeddings: dict[str, list[float]] = dict()
+
+    def set_mem_path(self, memory_saved: Path):
+        self.memory_saved = memory_saved
+        self.load(memory_saved)
+
+    def save(self, memory_saved: Path):
+        """
+        Save the BasicMemory nodes in nodes.json form, reproducing GA's kw_strength.json format.
+        Only a target path needs to be supplied.
+        TODO nodes are stored in reverse order here; still to be verified (test_memory passes)
+        """
+        memory_json = dict()
+        for i in range(len(self.storage)):
+            memory_node = self.storage[len(self.storage) - i - 1]
+            memory_node = memory_node.save_to_dict()
+            memory_json.update(memory_node)
+        write_json_file(memory_saved.joinpath("nodes.json"), memory_json)
+        write_json_file(memory_saved.joinpath("embeddings.json"), self.embeddings)
+
+        strength_json = dict()
+        strength_json["kw_strength_event"] = self.kw_strength_event
+        strength_json["kw_strength_thought"] = self.kw_strength_thought
+        write_json_file(memory_saved.joinpath("kw_strength.json"), strength_json)
+
+    def load(self, memory_saved: Path):
+        """
+        Parse GA's JSON files and populate this AgentMemory instance.
+        """
+        self.embeddings = read_json_file(memory_saved.joinpath("embeddings.json"))
+        memory_load = read_json_file(memory_saved.joinpath("nodes.json"))
+        for count in range(len(memory_load.keys())):
+            node_id = f"node_{str(count + 1)}"
+            node_details = memory_load[node_id]
+            node_type = node_details["type"]
+            created = datetime.strptime(node_details["created"], "%Y-%m-%d %H:%M:%S")
+            expiration = None
+            if node_details["expiration"]:
+                expiration = datetime.strptime(node_details["expiration"], "%Y-%m-%d %H:%M:%S")
+
+            s = node_details["subject"]
+            p = node_details["predicate"]
+            o = node_details["object"]
+
+            description = node_details["description"]
+            embedding_pair = (node_details["embedding_key"], self.embeddings[node_details["embedding_key"]])
+            poignancy = node_details["poignancy"]
+            keywords = set(node_details["keywords"])
+            filling = node_details["filling"]
+            if node_type == "thought":
+                self.add_thought(
+                    created, expiration, s, p, o, description, keywords, poignancy, embedding_pair, filling
+                )
+            if node_type == "event":
+                self.add_event(created, expiration, s, p, o, description, keywords, poignancy, embedding_pair, filling)
+            if node_type == "chat":
+                self.add_chat(created, expiration, s, p, o, description, keywords, poignancy, embedding_pair, filling)
+
+        strength_keywords_load = read_json_file(memory_saved.joinpath("kw_strength.json"))
+        if strength_keywords_load["kw_strength_event"]:
+            self.kw_strength_event = strength_keywords_load["kw_strength_event"]
+        if strength_keywords_load["kw_strength_thought"]:
+            self.kw_strength_thought = strength_keywords_load["kw_strength_thought"]
+
+    def add(self, memory_basic: BasicMemory):
+        """
+        Add a new message to storage, while updating the index.
+        Overrides Memory.add: accepts a BasicMemory instead of a Message and
+        routes the node to the list matching its memory type.
+        """
+        if memory_basic.memory_id in [mem.memory_id for mem in self.storage]:
+            return
+        self.storage.append(memory_basic)
+        if memory_basic.memory_type == "chat":
+            self.chat_list[0:0] = [memory_basic]
+            return
+        if memory_basic.memory_type == "thought":
+            self.thought_list[0:0] = [memory_basic]
+            return
+        if memory_basic.memory_type == "event":
+            self.event_list[0:0] = [memory_basic]
+            return
+
+    def add_chat(
+        self, created, expiration, s, p, o, content, keywords, poignancy, embedding_pair, filling, cause_by=""
+    ):
+        """
+        Calls add() to register a chat memory; the embedding has to be computed at creation time.
+        """
+        memory_count = len(self.storage) + 1
+        type_count = len(self.chat_list) + 1
+        memory_type = "chat"
+        memory_id = f"node_{str(memory_count)}"
+        depth = 1
+
+        memory_node = BasicMemory(
+            memory_id=memory_id,
+            memory_count=memory_count,
+            type_count=type_count,
+            memory_type=memory_type,
+            depth=depth,
+            created=created,
+            expiration=expiration,
+            subject=s,
+            predicate=p,
+            object=o,
+            description=content,
+            embedding_key=embedding_pair[0],
+            poignancy=poignancy,
+            keywords=keywords,
+            filling=filling,
+            cause_by=cause_by,
+        )
+
+        keywords = [i.lower() for i in keywords]
+        for kw in keywords:
+            if kw in self.chat_keywords:
+                self.chat_keywords[kw][0:0] = [memory_node]
+            else:
+                self.chat_keywords[kw] = [memory_node]
+
+        self.add(memory_node)
+
+        self.embeddings[embedding_pair[0]] = embedding_pair[1]
+        return memory_node
+
+    def add_thought(self, created, expiration, s, p, o, content, keywords, poignancy, embedding_pair, filling):
+        """
+        Calls add() to register a thought memory.
+        """
+        memory_count = len(self.storage) + 1
+        type_count = len(self.thought_list) + 1
+        memory_type = "thought"
+        memory_id = f"node_{str(memory_count)}"
+        depth = 1
+
+        try:
+            if filling:
+                depth_list = [memory_node.depth for memory_node in self.storage if memory_node.memory_id in filling]
+                depth += max(depth_list)
+        except Exception as exp:
+            logger.warning(f"filling init error: {exp}")
+            pass
+
+        memory_node = BasicMemory(
+            memory_id=memory_id,
+            memory_count=memory_count,
+            type_count=type_count,
+            memory_type=memory_type,
+            depth=depth,
+            created=created,
+            expiration=expiration,
+            subject=s,
predicate=p,
+            object=o,
+            description=content,
+            embedding_key=embedding_pair[0],
+            poignancy=poignancy,
+            keywords=keywords,
+            filling=filling,
+        )
+
+        keywords = [i.lower() for i in keywords]
+        for kw in keywords:
+            if kw in self.thought_keywords:
+                self.thought_keywords[kw][0:0] = [memory_node]
+            else:
+                self.thought_keywords[kw] = [memory_node]
+
+        self.add(memory_node)
+
+        if f"{p} {o}" != "is idle":
+            for kw in keywords:
+                if kw in self.kw_strength_thought:
+                    self.kw_strength_thought[kw] += 1
+                else:
+                    self.kw_strength_thought[kw] = 1
+
+        self.embeddings[embedding_pair[0]] = embedding_pair[1]
+        return memory_node
+
+    def add_event(self, created, expiration, s, p, o, content, keywords, poignancy, embedding_pair, filling):
+        """
+        Calls add() to register an event memory.
+        """
+        memory_count = len(self.storage) + 1
+        type_count = len(self.event_list) + 1
+        memory_type = "event"
+        memory_id = f"node_{str(memory_count)}"
+        depth = 0
+
+        if "(" in content:
+            content = " ".join(content.split()[:3]) + " " + content.split("(")[-1][:-1]
+
+        memory_node = BasicMemory(
+            memory_id=memory_id,
+            memory_count=memory_count,
+            type_count=type_count,
+            memory_type=memory_type,
+            depth=depth,
+            created=created,
+            expiration=expiration,
+            subject=s,
+            predicate=p,
+            object=o,
+            description=content,
+            embedding_key=embedding_pair[0],
+            poignancy=poignancy,
+            keywords=keywords,
+            filling=filling,
+        )
+
+        keywords = [i.lower() for i in keywords]
+        for kw in keywords:
+            if kw in self.event_keywords:
+                self.event_keywords[kw][0:0] = [memory_node]
+            else:
+                self.event_keywords[kw] = [memory_node]
+
+        self.add(memory_node)
+
+        if f"{p} {o}" != "is idle":
+            for kw in keywords:
+                if kw in self.kw_strength_event:
+                    self.kw_strength_event[kw] += 1
+                else:
+                    self.kw_strength_event[kw] = 1
+
+        self.embeddings[embedding_pair[0]] = embedding_pair[1]
+        return memory_node
+
+    def get_summarized_latest_events(self, retention):
+        ret_set = set()
+        for e_node in self.event_list[:retention]:
+            ret_set.add(e_node.summary())
+        return ret_set
+
+    def get_last_chat(self, target_role_name: str):
+        if target_role_name.lower() in self.chat_keywords:
+            return self.chat_keywords[target_role_name.lower()][0]
+        else:
+            return False
+
+    def retrieve_relevant_thoughts(self, s_content: str, p_content: str, o_content: str) -> set:
+        contents = [s_content, p_content, o_content]
+
+        ret = []
+        for i in contents:
+            if i.lower() in self.thought_keywords:
+                ret += self.thought_keywords[i.lower()]
+
+        ret = set(ret)
+        return ret
+
+    def retrieve_relevant_events(self, s_content: str, p_content: str, o_content: str) -> set:
+        contents = [s_content, p_content, o_content]
+
+        ret = []
+        for i in contents:
+            if i.lower() in self.event_keywords:
+                ret += self.event_keywords[i.lower()]
+
+        ret = set(ret)
+        return ret
diff --git a/metagpt/ext/stanford_town/memory/retrieve.py b/metagpt/ext/stanford_town/memory/retrieve.py
new file mode 100644
index 0000000000..c4b32f9650
--- /dev/null
+++ b/metagpt/ext/stanford_town/memory/retrieve.py
@@ -0,0 +1,180 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+# @Desc : Retrieve implementation
+
+import datetime
+
+from numpy import dot
+from numpy.linalg import norm
+
+from metagpt.ext.stanford_town.memory.agent_memory import BasicMemory
+from metagpt.ext.stanford_town.utils.utils import get_embedding
+
+
+def agent_retrieve(
+    agent_memory,
+    curr_time: datetime.datetime,
+    memory_forget: float,
+    query: str,
+    nodes: list[BasicMemory],
+    topk: int = 4,
+) -> list[str]:
+    """
+    Retrieve is meant to be used together with a Role, since only a Role owns the AgentMemory and scratch.
    Flow: the Role calls this function with self.rc.AgentMemory, self.rc.scratch.curr_time and self.rc.scratch.memory_forget.
    Given the query content and how many memories to look back over, it returns the ids of the top-k
    highest-scoring memories.

    Example score_list entry:
    {
        "memory": memories[i],  # a BasicMemory instance
        "importance": memories[i].poignancy,
        "recency": result of the decay-factor computation,
        "relevance": the similarity-search result,
    }
    """
+    memories = nodes
+    agent_memory_embedding = agent_memory.embeddings
+    memories = sorted(memories, key=lambda memory_node: memory_node.last_accessed, reverse=True)
+
+    score_list = []
+    score_list = extract_importance(memories, score_list)
+    score_list = extract_recency(curr_time, memory_forget, score_list)
+    score_list = extract_relevance(agent_memory_embedding, query, score_list)
+    score_list = normalize_score_floats(score_list, 0, 1)
+
+    total_dict = {}
+    gw = [1, 1, 1]  # weights of the three factors: importance, recency, relevance
+    for i in range(len(score_list)):
+        total_score = (
+            score_list[i]["importance"] * gw[0] + score_list[i]["recency"] * gw[1] + score_list[i]["relevance"] * gw[2]
+        )
+        total_dict[score_list[i]["memory"].memory_id] = total_score
+
+    result = top_highest_x_values(total_dict, topk)
+
+    return result  # a list of the top-k memory ids
+
+
+def new_agent_retrieve(role, focus_points: list, n_count=30) -> dict:
+    """
+    Takes a role, a list of focus points and the number of memories to retrieve.
+    Returns a dict mapping each focus point to its list of retrieved memories.
+    """
+    retrieved = dict()
+    for focal_pt in focus_points:
+        nodes = [
+            [i.last_accessed, i]
+            for i in role.memory.event_list + role.memory.thought_list
+            if "idle" not in i.embedding_key
+        ]
+        nodes = sorted(nodes, key=lambda x: x[0])
+        nodes = [i for created, i in nodes]
+        results = agent_retrieve(
+            role.memory, role.scratch.curr_time, role.scratch.recency_decay, focal_pt, nodes, n_count
+        )
+        final_result = []
+        for n in results:
+            for i in role.memory.storage:
+                if i.memory_id == n:
+                    i.last_accessed = role.scratch.curr_time
+                    final_result.append(i)
+
+        retrieved[focal_pt] = final_result
+
+    return retrieved
+
+
+def top_highest_x_values(d, x):
+    """
+    Takes a dict and an integer x; returns the keys of the x highest values
+    (here: memory ids), sorted by value in descending order.
+    """
+    top_v = [item[0] for item in sorted(d.items(), key=lambda item: item[1], reverse=True)[:x]]
+    return top_v
+
+
+def extract_importance(memories, score_list):
+    """
+    Extract each memory's importance score (its poignancy).
+    """
+    for i in range(len(memories)):
+        score = {"memory": memories[i], "importance": memories[i].poignancy}
+        score_list.append(score)
+    return score_list
+
+
+def extract_relevance(agent_memory_embedding, query, score_list):
+    """
+    Extract the relevance score: cosine similarity between each memory's embedding and the query embedding.
+    """
+    query_embedding = get_embedding(query)
+    # score each memory against the query
+    for i in range(len(score_list)):
+        node_embedding = agent_memory_embedding[score_list[i]["memory"].embedding_key]
+        result = cos_sim(node_embedding, query_embedding)
+        score_list[i]["relevance"] = result
+
+    return score_list
+
+
+def extract_recency(curr_time, memory_forget, score_list):
+    """
+    Extract the recency score; currently one decay factor is applied per elapsed real-world day.
+    """
+    for i in range(len(score_list)):
+        day_count = (curr_time - score_list[i]["memory"].created).days
+        score_list[i]["recency"] = memory_forget**day_count
+    return score_list
+
+
+def cos_sim(a, b):
+    """
+    Compute cosine similarity.
+    """
+    return dot(a, b) / (norm(a) * norm(b))
+
+
+def normalize_list_floats(single_list, target_min, target_max):
+    """
+    Min-max normalize a single list.
+    """
+    if len(single_list) == 0:
+        return []
+
+    min_val = min(single_list)
+    max_val = max(single_list)
+    range_val = max_val - min_val
+
+    if range_val == 0:
+        for i in range(len(single_list)):
+            single_list[i] = (target_max - target_min) / 2
+    else:
+        for i in range(len(single_list)):
+            single_list[i] = (single_list[i] - min_val) * (target_max - target_min) / range_val + target_min
+    return single_list
+
+
+def 
normalize_score_floats(score_list, target_min, target_max):
+    """
+    Normalize all three factor lists together.
+    """
+    importance_list = []
+    relevance_list = []
+    recency_list = []
+
+    for i in range(len(score_list)):
+        importance_list.append(score_list[i]["importance"])
+        relevance_list.append(score_list[i]["relevance"])
+        recency_list.append(score_list[i]["recency"])
+
+    # run the normalization
+    importance_list = normalize_list_floats(importance_list, target_min, target_max)
+    relevance_list = normalize_list_floats(relevance_list, target_min, target_max)
+    recency_list = normalize_list_floats(recency_list, target_min, target_max)
+
+    for i in range(len(score_list)):
+        score_list[i]["importance"] = importance_list[i]
+        score_list[i]["relevance"] = relevance_list[i]
+        score_list[i]["recency"] = recency_list[i]
+
+    return score_list
diff --git a/metagpt/ext/stanford_town/memory/scratch.py b/metagpt/ext/stanford_town/memory/scratch.py
new file mode 100644
index 0000000000..b4036f839f
--- /dev/null
+++ b/metagpt/ext/stanford_town/memory/scratch.py
@@ -0,0 +1,383 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+# @Desc : Scratch class (persona state and profile)
+
+from datetime import datetime, timedelta
+from pathlib import Path
+from typing import Optional, Union
+
+from pydantic import BaseModel, Field, field_serializer, field_validator
+
+from metagpt.utils.common import read_json_file, write_json_file
+
+
+class Scratch(BaseModel):
+    # Category 1: persona hyperparameters
+    vision_r: int = 4
+    att_bandwidth: int = 3
+    retention: int = 5
+
+    # Category 2: world information
+    curr_time: Optional[datetime] = Field(default=None)
+    curr_tile: Optional[list[int]] = Field(default=None)
+    daily_plan_req: Optional[str] = Field(default=None)
+
+    # Category 3: the persona's core identity
+    name: Optional[str] = Field(default=None)
+    first_name: Optional[str] = Field(default=None)
+    last_name: Optional[str] = Field(default=None)
+    age: Optional[int] = Field(default=None)
+    innate: Optional[str] = Field(default=None)  # L0 permanent core traits.
+    learned: Optional[str] = Field(default=None)  # L1 stable traits.
+    currently: Optional[str] = Field(default=None)  # L2 external implementation.
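+    # Illustrative example: innate="curious, kind", learned="Klaus is a student
+    # studying gentrification", currently="Klaus is writing a research paper";
+    # the three tiers run from permanent traits to the current situation.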
+    lifestyle: Optional[str] = Field(default=None)
+    living_area: Optional[str] = Field(default=None)
+
+    # Category 4: legacy reflection variables
+    concept_forget: int = 100
+    daily_reflection_time: int = 60 * 3
+    daily_reflection_size: int = 5
+    overlap_reflect_th: int = 2
+    kw_strg_event_reflect_th: int = 4
+    kw_strg_thought_reflect_th: int = 4
+
+    # Category 5: new reflection variables
+    recency_w: int = 1
+    relevance_w: int = 1
+    importance_w: int = 1
+    recency_decay: float = 0.99
+    importance_trigger_max: int = 150
+    importance_trigger_curr: int = 150
+    importance_ele_n: int = 0
+    thought_count: int = 5
+
+    # Category 6: personal plans
+    daily_req: list[str] = Field(default=[])
+    f_daily_schedule: list[list[Union[int, str]]] = Field(default=[])
+    f_daily_schedule_hourly_org: list[list[Union[int, str]]] = Field(default=[])
+
+    # Category 7: current action
+    act_address: Optional[str] = Field(default=None)
+    act_start_time: Optional[datetime] = Field(default=None)
+    act_duration: Optional[int] = Field(default=None)
+    act_description: Optional[str] = Field(default=None)
+    act_pronunciatio: Optional[str] = Field(default=None)
+    act_event: list[Optional[str]] = [None, None, None]
+
+    act_obj_description: Optional[str] = Field(default=None)
+    act_obj_pronunciatio: Optional[str] = Field(default=None)
+    act_obj_event: list[Optional[str]] = [None, None, None]
+
+    chatting_with: Optional[str] = Field(default=None)
+    chat: Optional[str] = Field(default=None)
+    chatting_with_buffer: dict = dict()
+    chatting_end_time: Optional[datetime] = Field(default=None)
+
+    act_path_set: bool = False
+    planned_path: list[list[int]] = Field(default=[])
+
+    @field_validator("curr_time", "act_start_time", "chatting_end_time", mode="before")
+    @classmethod
+    def check_time_field(cls, time_field):
+        val = datetime.strptime(time_field, "%B %d, %Y, %H:%M:%S") if time_field else None
+        return val
+
+    @field_serializer("curr_time", "act_start_time", "chatting_end_time")
+    def transform_time_field(self, time_field: Optional[datetime]) -> str:
+        if time_field:
+            time_field = time_field.strftime("%B %d, %Y, %H:%M:%S")
+        return time_field
+
+    @classmethod
+    def init_scratch_from_path(cls, f_saved: Path):
+        scratch_load = read_json_file(f_saved)
+        scratch = Scratch(**scratch_load)
+        return scratch
+
+    def save(self, out_json: Path):
+        """
+        Save persona's scratch.
+
+        INPUT:
+            out_json: The file where we will be saving our persona's state.
+        OUTPUT:
+            None
+        """
+        scratch = self.model_dump()
+        write_json_file(out_json, scratch, encoding="utf-8")
+
+    def get_f_daily_schedule_index(self, advance=0):
+        """
+        We get the current index of self.f_daily_schedule.
+
+        Recall that self.f_daily_schedule stores the decomposed action sequences
+        up until now, and the hourly sequences of the future action for the rest
+        of today. Given that self.f_daily_schedule is a list of list where the
+        inner list is composed of [task, duration], we continue to add up the
+        duration until we reach "if elapsed > today_min_elapsed" condition. The
+        index where we stop is the index we will return.
+
+        INPUT
+            advance: Integer value of the number minutes we want to look into the
+                     future. This allows us to get the index of a future timeframe.
+        OUTPUT
+            an integer value for the current index of f_daily_schedule.
+        """
+        # We first calculate the number of minutes elapsed today.
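+        # Illustrative example: at 06:30, today_min_elapsed = 390; with
+        # f_daily_schedule = [["sleeping", 360], ["morning routine", 60],
+        # ["breakfast", 60]], the walk below accumulates 360, then 420 > 390,
+        # so index 1 ("morning routine") is returned.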
+        today_min_elapsed = 0
+        today_min_elapsed += self.curr_time.hour * 60
+        today_min_elapsed += self.curr_time.minute
+        today_min_elapsed += advance
+
+        # We then calculate the current index based on that.
+        curr_index = 0
+        elapsed = 0
+        for task, duration in self.f_daily_schedule:
+            elapsed += duration
+            if elapsed > today_min_elapsed:
+                return curr_index
+            curr_index += 1
+
+        return curr_index
+
+    def get_f_daily_schedule_hourly_org_index(self, advance=0):
+        """
+        We get the current index of self.f_daily_schedule_hourly_org.
+        It is otherwise the same as get_f_daily_schedule_index.
+
+        INPUT
+            advance: Integer value of the number of minutes we want to look into
+                     the future. This allows us to get the index of a future timeframe.
+        OUTPUT
+            an integer value for the current index of f_daily_schedule.
+        """
+        # We first calculate the number of minutes elapsed today.
+        today_min_elapsed = 0
+        today_min_elapsed += self.curr_time.hour * 60
+        today_min_elapsed += self.curr_time.minute
+        today_min_elapsed += advance
+        # We then calculate the current index based on that.
+        curr_index = 0
+        elapsed = 0
+        for task, duration in self.f_daily_schedule_hourly_org:
+            elapsed += duration
+            if elapsed > today_min_elapsed:
+                return curr_index
+            curr_index += 1
+        return curr_index
+
+    def get_str_iss(self):
+        """
+        ISS stands for "identity stable set." This describes the commonset summary
+        of this persona -- basically, the bare minimum description of the persona
+        that gets used in almost all prompts that need to call on the persona.
+
+        INPUT
+            None
+        OUTPUT
+            the identity stable set summary of the persona in a string form.
+        EXAMPLE STR OUTPUT
+            "Name: Dolores Heitmiller
+             Age: 28
+             Innate traits: hard-edged, independent, loyal
+             Learned traits: Dolores is a painter who wants to live quietly and paint
+               while enjoying her everyday life.
+             Currently: Dolores is preparing for her first solo show. She mostly
+               works from home.
+             Lifestyle: Dolores goes to bed around 11pm, sleeps for 7 hours, eats
+               dinner around 6pm.
+             Daily plan requirement: Dolores is planning to stay at home all day and
+               never go out."
+ """ + commonset = "" + commonset += f"Name: {self.name}\n" + commonset += f"Age: {self.age}\n" + commonset += f"Innate traits: {self.innate}\n" + commonset += f"Learned traits: {self.learned}\n" + commonset += f"Currently: {self.currently}\n" + commonset += f"Lifestyle: {self.lifestyle}\n" + commonset += f"Daily plan requirement: {self.daily_plan_req}\n" + commonset += f"Current Date: {self.curr_time.strftime('%A %B %d') if self.curr_time else ''}\n" + return commonset + + def get_str_name(self): + return self.name + + def get_str_firstname(self): + return self.first_name + + def get_str_lastname(self): + return self.last_name + + def get_str_age(self): + return str(self.age) + + def get_str_innate(self): + return self.innate + + def get_str_learned(self): + return self.learned + + def get_str_currently(self): + return self.currently + + def get_str_lifestyle(self): + return self.lifestyle + + def get_str_daily_plan_req(self): + return self.daily_plan_req + + def get_str_curr_date_str(self): + return self.curr_time.strftime("%A %B %d") + + def get_curr_event(self): + if not self.act_address: + return self.name, None, None + else: + return self.act_event + + def get_curr_event_and_desc(self): + if not self.act_address: + return self.name, None, None, None + else: + return self.act_event[0], self.act_event[1], self.act_event[2], self.act_description + + def get_curr_obj_event_and_desc(self): + if not self.act_address: + return "", None, None, None + else: + return self.act_address, self.act_obj_event[1], self.act_obj_event[2], self.act_obj_description + + def add_new_action( + self, + action_address, + action_duration, + action_description, + action_pronunciatio, + action_event, + chatting_with, + chat, + chatting_with_buffer, + chatting_end_time, + act_obj_description, + act_obj_pronunciatio, + act_obj_event, + act_start_time=None, + ): + self.act_address = action_address + self.act_duration = action_duration + self.act_description = action_description + self.act_pronunciatio = action_pronunciatio + self.act_event = action_event + + self.chatting_with = chatting_with + self.chat = chat + if chatting_with_buffer: + self.chatting_with_buffer.update(chatting_with_buffer) + self.chatting_end_time = chatting_end_time + + self.act_obj_description = act_obj_description + self.act_obj_pronunciatio = act_obj_pronunciatio + self.act_obj_event = act_obj_event + + self.act_start_time = self.curr_time + + self.act_path_set = False + + def act_time_str(self): + """ + Returns a string output of the current time. + + INPUT + None + OUTPUT + A string output of the current time. + EXAMPLE STR OUTPUT + "14:05 P.M." + """ + return self.act_start_time.strftime("%H:%M %p") + + def act_check_finished(self): + """ + Checks whether the self.Action instance has finished. + + INPUT + curr_datetime: Current time. If current time is later than the action's + start time + its duration, then the action has finished. + OUTPUT + Boolean [True]: Action has finished. + Boolean [False]: Action has not finished and is still ongoing. + """ + if not self.act_address: + return True + + if self.chatting_with: + end_time = self.chatting_end_time + else: + x = self.act_start_time + if x.second != 0: + x = x.replace(second=0) + x = x + timedelta(minutes=1) + end_time = x + timedelta(minutes=self.act_duration) + + if end_time.strftime("%H:%M:%S") == self.curr_time.strftime("%H:%M:%S"): + return True + return False + + def act_summarize(self): + """ + Summarize the current action as a dictionary. 
+
+        INPUT
+            None
+        OUTPUT
+            exp: A dictionary summary of the action.
+        """
+        exp = dict()
+        exp["persona"] = self.name
+        exp["address"] = self.act_address
+        exp["start_datetime"] = self.act_start_time
+        exp["duration"] = self.act_duration
+        exp["description"] = self.act_description
+        exp["pronunciatio"] = self.act_pronunciatio
+        return exp
+
+    def act_summary_str(self):
+        """
+        Returns a string summary of the current action. Meant to be
+        human-readable.
+
+        INPUT
+            None
+        OUTPUT
+            ret: A human readable summary of the action.
+        """
+        start_datetime_str = self.act_start_time.strftime("%A %B %d -- %H:%M %p")
+        ret = f"[{start_datetime_str}]\n"
+        ret += f"Activity: {self.name} is {self.act_description}\n"
+        ret += f"Address: {self.act_address}\n"
+        ret += f"Duration in minutes (e.g., x min): {str(self.act_duration)} min\n"
+        return ret
+
+    def get_daily_schedule(self, daily_schedule: list[list[Union[str, int]]]):
+        ret = ""
+        curr_min_sum = 0
+        for row in daily_schedule:
+            curr_min_sum += row[1]
+            hour = int(curr_min_sum / 60)
+            minute = curr_min_sum % 60
+            ret += f"{hour:02}:{minute:02} || {row[0]}\n"
+        return ret
+
+    def get_str_daily_schedule_summary(self):
+        return self.get_daily_schedule(self.f_daily_schedule)
+
+    def get_str_daily_schedule_hourly_org_summary(self):
+        return self.get_daily_schedule(self.f_daily_schedule_hourly_org)
diff --git a/metagpt/ext/stanford_town/memory/spatial_memory.py b/metagpt/ext/stanford_town/memory/spatial_memory.py
new file mode 100644
index 0000000000..71b8569079
--- /dev/null
+++ b/metagpt/ext/stanford_town/memory/spatial_memory.py
@@ -0,0 +1,116 @@
+"""
+Author: Joon Sung Park (joonspk@stanford.edu)
+
+File: spatial_memory.py
+Description: Defines the MemoryTree class that serves as the agents' spatial
+memory that aids in grounding their behavior in the game world.
+"""
+from pathlib import Path
+
+from pydantic import BaseModel, Field
+
+from metagpt.logs import logger
+from metagpt.utils.common import read_json_file, write_json_file
+
+
+class MemoryTree(BaseModel):
+    tree: dict = Field(default_factory=dict)
+
+    def set_mem_path(self, f_saved: Path):
+        self.tree = read_json_file(f_saved)
+
+    def print_tree(self) -> None:
+        def _print_tree(tree, depth):
+            dash = " >" * depth
+            if isinstance(tree, list):
+                if tree:
+                    logger.info(f"{dash} {tree}")
+                return
+
+            for key, val in tree.items():
+                if key:
+                    logger.info(f"{dash} {key}")
+                _print_tree(val, depth + 1)
+
+        _print_tree(self.tree, 0)
+
+    def save(self, out_json: Path) -> None:
+        write_json_file(out_json, self.tree)
+
+    def get_str_accessible_sectors(self, curr_world: str) -> str:
+        """
+        Returns a summary string of all the sectors that the persona can access
+        within the current world.
+
+        Note that there are places a given persona cannot enter. This information
+        is provided in the persona sheet. We account for this in this function.
+
+        INPUT
+            curr_world: the name of the current world.
+        OUTPUT
+            A summary string of all the sectors that the persona can access.
+        EXAMPLE STR OUTPUT
+            "bedroom, kitchen, dining room, office, bathroom"
+        """
+        x = ", ".join(list(self.tree[curr_world].keys()))
+        return x
+
+    def get_str_accessible_sector_arenas(self, sector: str) -> str:
+        """
+        Returns a summary string of all the arenas that the persona can access
+        within the current sector.
+
+        Note that there are places a given persona cannot enter. This information
+        is provided in the persona sheet. We account for this in this function.
+
+        INPUT
+            sector: the "world:sector" address string.
+        OUTPUT
+            A summary string of all the arenas that the persona can access.
+        EXAMPLE STR OUTPUT
+            "bedroom, kitchen, dining room, office, bathroom"
+        """
+        curr_world, curr_sector = sector.split(":")
+        if not curr_sector:
+            return ""
+        x = ", ".join(list(self.tree[curr_world][curr_sector].keys()))
+        return x
+
+    def get_str_accessible_arena_game_objects(self, arena: str) -> str:
+        """
+        Get a str list of all accessible game objects that are in the given
+        arena.
+
+        INPUT
+            arena: the "world:sector:arena" address string.
+        OUTPUT
+            str list of all accessible game objects in the game arena.
+        EXAMPLE STR OUTPUT
+            "phone, charger, bed, nightstand"
+        """
+        curr_world, curr_sector, curr_arena = arena.split(":")
+
+        if not curr_arena:
+            return ""
+
+        try:
+            x = ", ".join(list(self.tree[curr_world][curr_sector][curr_arena]))
+        except Exception:
+            x = ", ".join(list(self.tree[curr_world][curr_sector][curr_arena.lower()]))
+        return x
+
+    def add_tile_info(self, tile_info: dict) -> None:
+        if tile_info["world"]:
+            if tile_info["world"] not in self.tree:
+                self.tree[tile_info["world"]] = {}
+        if tile_info["sector"]:
+            if tile_info["sector"] not in self.tree[tile_info["world"]]:
+                self.tree[tile_info["world"]][tile_info["sector"]] = {}
+        if tile_info["arena"]:
+            if tile_info["arena"] not in self.tree[tile_info["world"]][tile_info["sector"]]:
+                self.tree[tile_info["world"]][tile_info["sector"]][tile_info["arena"]] = []
+        if tile_info["game_object"]:
+            if tile_info["game_object"] not in self.tree[tile_info["world"]][tile_info["sector"]][tile_info["arena"]]:
+                self.tree[tile_info["world"]][tile_info["sector"]][tile_info["arena"]] += [tile_info["game_object"]]
diff --git a/metagpt/ext/stanford_town/plan/__init__.py b/metagpt/ext/stanford_town/plan/__init__.py
new file mode 100644
index 0000000000..2bcf8efd09
--- /dev/null
+++ b/metagpt/ext/stanford_town/plan/__init__.py
@@ -0,0 +1,3 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+# @Desc :
diff --git a/metagpt/ext/stanford_town/plan/converse.py b/metagpt/ext/stanford_town/plan/converse.py
new file mode 100644
index 0000000000..8eefbc9b42
--- /dev/null
+++ b/metagpt/ext/stanford_town/plan/converse.py
@@ -0,0 +1,93 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+# @Desc : conversation between two agents
+
+from typing import Tuple
+
+from metagpt.ext.stanford_town.actions.agent_chat_sum_rel import AgentChatSumRel
+from metagpt.ext.stanford_town.actions.gen_iter_chat_utt import GenIterChatUTT
+from metagpt.ext.stanford_town.memory.retrieve import new_agent_retrieve
+from metagpt.logs import logger
+
+
+async def agent_conversation(init_role: "STRole", target_role: "STRole", conv_rounds: int = 8) -> list[list[str]]:
+    curr_chat = []
+    logger.info(f"Role: {init_role.name} starts a conversation with Role: {target_role.name}")
+
+    for idx in range(conv_rounds):
+        logger.info(f"Conv round: {idx} between {init_role.name} and {target_role.name}")
+        scratch = init_role.rc.scratch
+        target_scratch = target_role.rc.scratch
+
+        focal_points = [f"{target_scratch.name}"]
+        retrieved = new_agent_retrieve(init_role, focal_points, 50)
+        relationship = await generate_summarize_agent_relationship(init_role, target_role, retrieved)
+        logger.info(f"The relationship between {init_role.name} and {target_role.name}: {relationship}")
+        last_chat = ""
+        for i in curr_chat[-4:]:
+            last_chat += ": ".join(i) + "\n"
+        if last_chat:
+            focal_points = [f"{relationship}", f"{target_scratch.name} is {target_scratch.act_description}", last_chat]
+        else:
+            focal_points = [f"{relationship}", f"{target_scratch.name} is {target_scratch.act_description}"]
+        retrieved = new_agent_retrieve(init_role, focal_points, 15)
+        utt, end = await generate_one_utterance(init_role, target_role, retrieved, curr_chat)
+
+        curr_chat += [[scratch.name, utt]]
+        if end:
+            break
+
+        focal_points = [f"{scratch.name}"]
+        retrieved = new_agent_retrieve(target_role, focal_points, 50)
+        relationship = await generate_summarize_agent_relationship(target_role, init_role, retrieved)
+        logger.info(f"The relationship between {target_role.name} and {init_role.name}: {relationship}")
+        last_chat = ""
+        for i in curr_chat[-4:]:
+            last_chat += ": ".join(i) + "\n"
+        if last_chat:
+            focal_points = [f"{relationship}", f"{scratch.name} is {scratch.act_description}", last_chat]
+        else:
+            focal_points = [f"{relationship}", f"{scratch.name} is {scratch.act_description}"]
+        retrieved = new_agent_retrieve(target_role, focal_points, 15)
+        utt, end = await generate_one_utterance(target_role, init_role, retrieved, curr_chat)
+
+        curr_chat += [[target_scratch.name, utt]]
+        if end:
+            break
+
+    logger.warning(f"Conversations between {target_role.name} and {init_role.name}:")
+    for row in curr_chat:
+        logger.info(row)
+
+    return curr_chat
+
+
+async def generate_summarize_agent_relationship(init_role: "STRole", target_role: "STRole", retrieved: dict) -> str:
+    all_embedding_keys = list()
+    for key, val in retrieved.items():
+        for i in val:
+            all_embedding_keys += [i.embedding_key]
+    all_embedding_key_str = ""
+    for i in all_embedding_keys:
+        all_embedding_key_str += f"{i}\n"
+
+    summarized_relationship = await AgentChatSumRel().run(init_role, target_role, all_embedding_key_str)
+    return summarized_relationship
+
+
+async def generate_one_utterance(init_role, target_role, retrieved: dict, curr_chat: list) -> Tuple[str, str]:
+    # Chat version optimized for speed via batch generation
+    scratch = init_role.rc.scratch
+    target_scratch = target_role.rc.scratch
+    curr_context = (
+        f"{scratch.name} "
+        + f"was {scratch.act_description} "
+        + f"when {scratch.name} "
+        + f"saw {target_scratch.name} "
+        + f"in the middle of {target_scratch.act_description}.\n"
+    )
+    curr_context += f"{scratch.name} " + "is initiating a conversation with " + f"{target_scratch.name}."
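+
+    # GenIterChatUTT is expected to return a dict holding the next utterance and an
+    # end-of-conversation flag, e.g. {"utterance": "Hi Klaus!", "end": False} (illustrative
+    # values); both entries are unpacked below.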
+    x = await GenIterChatUTT().run(init_role, target_role, retrieved, curr_context, curr_chat)
+
+    return x["utterance"], x["end"]
diff --git a/metagpt/ext/stanford_town/plan/st_plan.py b/metagpt/ext/stanford_town/plan/st_plan.py
new file mode 100644
index 0000000000..f63052fc53
--- /dev/null
+++ b/metagpt/ext/stanford_town/plan/st_plan.py
@@ -0,0 +1,706 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+# @Desc : Stanford Town roles' planning execution
+
+import datetime
+import math
+import random
+from typing import Tuple, Union
+
+from metagpt.ext.stanford_town.actions.decide_to_talk import DecideToTalk
+from metagpt.ext.stanford_town.actions.gen_action_details import GenActionDetails
+from metagpt.ext.stanford_town.actions.gen_daily_schedule import GenDailySchedule
+from metagpt.ext.stanford_town.actions.gen_hourly_schedule import GenHourlySchedule
+from metagpt.ext.stanford_town.actions.new_decomp_schedule import NewDecompSchedule
+from metagpt.ext.stanford_town.actions.summarize_conv import SummarizeConv
+from metagpt.ext.stanford_town.actions.task_decomp import TaskDecomp
+from metagpt.ext.stanford_town.actions.wake_up import WakeUp
+from metagpt.ext.stanford_town.memory.retrieve import new_agent_retrieve
+from metagpt.ext.stanford_town.plan.converse import agent_conversation
+from metagpt.ext.stanford_town.utils.utils import get_embedding
+from metagpt.llm import LLM
+from metagpt.logs import logger
+
+
+async def plan(role: "STRole", roles: dict[str, "STRole"], new_day: Union[bool, str], retrieved: dict) -> str:
+    # PART 1: Generate the hourly schedule.
+    if new_day:
+        await _long_term_planning(role, new_day)
+
+    # PART 2: If the current action has expired, we want to create a new plan.
+    act_check_finished = role.scratch.act_check_finished()
+    logger.info(f"Role: {role.name} act_check_finished is {act_check_finished}")
+    if act_check_finished:
+        await _determine_action(role)
+
+    # PART 3: If you perceived an event that needs to be responded to (saw
+    # another role), and retrieved relevant information.
+    # Step 1: Retrieved may have multiple events represented in it. The first
+    #         job here is to determine which of the events we want to focus
+    #         on for the role.
+    #         <focused_event> takes the form of a dictionary like this:
+    #         dictionary {["curr_event"] = <ConceptNode>,
+    #                     ["events"] = [<ConceptNode>, ...],
+    #                     ["thoughts"] = [<ConceptNode>, ...]}
+    focused_event = False
+    if retrieved.keys():
+        focused_event = _choose_retrieved(role.name, retrieved)
+
+    # Step 2: Once we choose an event, we need to determine whether the
+    #         role will take any actions for the perceived event. There are
+    #         three possible modes of reaction returned by _should_react.
+    #         a) "chat with {target_role.name}"
+    #         b) "react"
+    #         c) False
+    logger.info(f"Role: {role.name} focused_event: {focused_event}")
+    if focused_event:
+        reaction_mode = await _should_react(role, focused_event, roles)
+        logger.info(f"Role: {role.name} reaction_mode: {reaction_mode}")
+        if reaction_mode:
+            # If we do want to chat, then we generate conversation
+            if reaction_mode[:9] == "chat with":
+                await _chat_react(role, reaction_mode, roles)
+            elif reaction_mode[:4] == "wait":
+                await _wait_react(role, reaction_mode)
+
+    # Step 3: Chat-related state clean up.
+    # If the persona is not chatting with anyone, we clean up any of the
+    # chat-related states here.
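+    # act_event is a (subject, predicate, object) triple, e.g. ("Klaus", "chat with", "Maria");
+    # its predicate slot tells us whether the current action is still a conversation.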
+    if role.rc.scratch.act_event[1] != "chat with":
+        role.rc.scratch.chatting_with = None
+        role.rc.scratch.chat = None
+        role.rc.scratch.chatting_end_time = None
+    # We want to make sure that the persona does not keep conversing with each
+    # other in an infinite loop. So, chatting_with_buffer maintains a form of
+    # buffer that makes the persona wait from talking to the same target
+    # immediately after chatting once. We keep track of the buffer value here.
+    curr_persona_chat_buffer = role.rc.scratch.chatting_with_buffer
+    for persona_name, buffer_count in curr_persona_chat_buffer.items():
+        if persona_name != role.rc.scratch.chatting_with:
+            role.rc.scratch.chatting_with_buffer[persona_name] -= 1
+
+    return role.rc.scratch.act_address
+
+
+def _choose_retrieved(role_name: str, retrieved: dict) -> Union[None, dict]:
+    """
+    Retrieved elements have multiple core "curr_events". We need to choose one
+    event to which we are going to react. We pick that event here.
+    Args:
+        role_name: Current role instance's name whose action we are determining.
+        retrieved: A dictionary of <ConceptNode>s that were retrieved from the
+                   role's associative memory. This dictionary takes the
+                   following form:
+                   dictionary[event.description] =
+                       {["curr_event"] = <ConceptNode>,
+                        ["events"] = [<ConceptNode>, ...],
+                        ["thoughts"] = [<ConceptNode>, ...]}
+    """
+    # Once we are done with the reflection, we might want to build a more
+    # complex structure here.
+
+    # We do not want to take self events... for now
+    copy_retrieved = retrieved.copy()
+    for event_desc, rel_ctx in copy_retrieved.items():
+        curr_event = rel_ctx["curr_event"]
+        if curr_event.subject == role_name:
+            del retrieved[event_desc]
+
+    # Always choose role first.
+    priority = []
+    for event_desc, rel_ctx in retrieved.items():
+        curr_event = rel_ctx["curr_event"]
+        if ":" not in curr_event.subject and curr_event.subject != role_name:
+            priority += [rel_ctx]
+    if priority:
+        return random.choice(priority)
+
+    # Skip idle.
+    for event_desc, rel_ctx in retrieved.items():
+        if "is idle" not in event_desc:
+            priority += [rel_ctx]
+    if priority:
+        return random.choice(priority)
+    return None
+
+
+async def _should_react(role: "STRole", retrieved: dict, roles: dict):
+    """
+    Determines what form of reaction the role should exhibit given the
+    retrieved values.
+    INPUT
+        role: Current <"STRole"> instance whose action we are determining.
+        retrieved: A dictionary of <ConceptNode>s that were retrieved from the
+                   role's associative memory. This dictionary takes the
+                   following form:
+                   dictionary[event.description] =
+                       {["curr_event"] = <ConceptNode>,
+                        ["events"] = [<ConceptNode>, ...],
+                        ["thoughts"] = [<ConceptNode>, ...]}
+        roles: A dictionary that contains all role names as keys, and the
+               <"STRole"> instance as values.
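+    OUTPUT
+        "chat with {target_role.name}" to start a conversation, "wait: {time}" to
+        hold until the target finishes its current action, or False for no reaction.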
+ """ + + async def lets_talk(init_role: "STRole", target_role: "STRole", retrieved: dict): + if init_role.name == target_role.name: + logger.info(f"Role: {role.name} _should_react lets_talk meet same role, return False") + return False + + scratch = init_role.rc.scratch + target_scratch = target_role.rc.scratch + if ( + not target_scratch.act_address + or not target_scratch.act_description + or not scratch.act_address + or not scratch.act_description + ): + return False + + if "sleeping" in target_scratch.act_description or "sleeping" in scratch.act_description: + return False + + if scratch.curr_time.hour == 23: + return False + + if "" in target_scratch.act_address: + return False + + if target_scratch.chatting_with or scratch.chatting_with: + return False + + if target_role.name in scratch.chatting_with_buffer: + if scratch.chatting_with_buffer[target_role.name] > 0: + return False + + if await DecideToTalk().run(init_role, target_role, retrieved): + return True + + return False + + async def lets_react(init_role: "STRole", target_role: "STRole", retrieved: dict): + if init_role.name == target_role.name: + logger.info(f"Role: {role.name} _should_react lets_react meet same role, return False") + return False + + scratch = init_role.rc.scratch + target_scratch = target_role.rc.scratch + if ( + not target_scratch.act_address + or not target_scratch.act_description + or not scratch.act_address + or not scratch.act_description + ): + return False + + if "sleeping" in target_scratch.act_description or "sleeping" in scratch.act_description: + return False + + # return False + if scratch.curr_time.hour == 23: + return False + + if "waiting" in target_scratch.act_description: + return False + if scratch.planned_path == []: + return False + + if scratch.act_address != target_scratch.act_address: + return False + + react_mode = await DecideToTalk().run(init_role, target_role, retrieved) + + if react_mode == "1": + wait_until = ( + target_scratch.act_start_time + datetime.timedelta(minutes=target_scratch.act_duration - 1) + ).strftime("%B %d, %Y, %H:%M:%S") + return f"wait: {wait_until}" + elif react_mode == "2": + return False + return "do other things" + else: + return False # "keep" + + # If the role is chatting right now, default to no reaction + scratch = role.rc.scratch + if scratch.chatting_with: + return False + if "" in scratch.act_address: + return False + + # Recall that retrieved takes the following form: + # dictionary {["curr_event"] = } + curr_event = retrieved["curr_event"] + logger.info(f"Role: {role.name} _should_react curr_event.subject: {curr_event.subject}") + + if ":" not in curr_event.subject: + # this is a role event. + if await lets_talk(role, roles[curr_event.subject], retrieved): + return f"chat with {curr_event.subject}" + react_mode = await lets_react(role, roles[curr_event.subject], retrieved) + return react_mode + return False + + +async def _chat_react(role: "STRole", reaction_mode: str, roles: dict["STRole"]): + # There are two roles -- the role who is initiating the conversation + # and the role who is the target. We get the role instances here. + init_role = role + target_role = roles[reaction_mode[9:].strip()] + + # Actually creating the conversation here. 
+    convo, duration_min = await generate_convo(init_role, target_role)
+    convo_summary = await generate_convo_summary(convo)
+    inserted_act = convo_summary
+    inserted_act_dur = duration_min
+
+    act_start_time = target_role.rc.scratch.act_start_time
+
+    curr_time = target_role.rc.scratch.curr_time
+    if curr_time.second != 0:
+        temp_curr_time = curr_time + datetime.timedelta(seconds=60 - curr_time.second)
+        chatting_end_time = temp_curr_time + datetime.timedelta(minutes=inserted_act_dur)
+    else:
+        chatting_end_time = curr_time + datetime.timedelta(minutes=inserted_act_dur)
+
+    for role, p in [("init", init_role), ("target", target_role)]:
+        if role == "init":
+            act_address = f"<persona> {target_role.name}"
+            act_event = (p.name, "chat with", target_role.name)
+            chatting_with = target_role.name
+            chatting_with_buffer = {}
+            chatting_with_buffer[target_role.name] = 800
+        elif role == "target":
+            act_address = f"<persona> {init_role.name}"
+            act_event = (p.name, "chat with", init_role.name)
+            chatting_with = init_role.name
+            chatting_with_buffer = {}
+            chatting_with_buffer[init_role.name] = 800
+
+        act_pronunciatio = "💬"
+        act_obj_description = None
+        act_obj_pronunciatio = None
+        act_obj_event = (None, None, None)
+
+        await _create_react(
+            p,
+            inserted_act,
+            inserted_act_dur,
+            act_address,
+            act_event,
+            chatting_with,
+            convo,
+            chatting_with_buffer,
+            chatting_end_time,
+            act_pronunciatio,
+            act_obj_description,
+            act_obj_pronunciatio,
+            act_obj_event,
+            act_start_time,
+        )
+
+
+async def _create_react(
+    role: "STRole",
+    inserted_act: str,
+    inserted_act_dur: int,
+    act_address: str,
+    act_event: Tuple,
+    chatting_with: str,
+    chat: list,
+    chatting_with_buffer: dict,
+    chatting_end_time: datetime.datetime,
+    act_pronunciatio: str,
+    act_obj_description: str,
+    act_obj_pronunciatio: str,
+    act_obj_event: Tuple,
+    act_start_time=None,
+):
+    p = role
+    scratch = role.rc.scratch
+
+    min_sum = 0
+    for i in range(scratch.get_f_daily_schedule_hourly_org_index()):
+        min_sum += scratch.f_daily_schedule_hourly_org[i][1]
+    start_hour = int(min_sum / 60)
+
+    if scratch.f_daily_schedule_hourly_org[scratch.get_f_daily_schedule_hourly_org_index()][1] >= 120:
+        end_hour = (
+            start_hour + scratch.f_daily_schedule_hourly_org[scratch.get_f_daily_schedule_hourly_org_index()][1] / 60
+        )
+
+    elif (
+        scratch.f_daily_schedule_hourly_org[scratch.get_f_daily_schedule_hourly_org_index()][1]
+        + scratch.f_daily_schedule_hourly_org[scratch.get_f_daily_schedule_hourly_org_index() + 1][1]
+    ):
+        end_hour = start_hour + (
+            (
+                scratch.f_daily_schedule_hourly_org[scratch.get_f_daily_schedule_hourly_org_index()][1]
+                + scratch.f_daily_schedule_hourly_org[scratch.get_f_daily_schedule_hourly_org_index() + 1][1]
+            )
+            / 60
+        )
+
+    else:
+        end_hour = start_hour + 2
+    end_hour = int(end_hour)
+
+    dur_sum = 0
+    count = 0
+    start_index = None
+    end_index = None
+    for act, dur in scratch.f_daily_schedule:
+        if dur_sum >= start_hour * 60 and start_index is None:
+            start_index = count
+        if dur_sum >= end_hour * 60 and end_index is None:
+            end_index = count
+        dur_sum += dur
+        count += 1
+
+    ret = await generate_new_decomp_schedule(p, inserted_act, inserted_act_dur, start_hour, end_hour)
+    scratch.f_daily_schedule[start_index:end_index] = ret
+    scratch.add_new_action(
+        act_address,
+        inserted_act_dur,
+        inserted_act,
+        act_pronunciatio,
+        act_event,
+        chatting_with,
+        chat,
+        chatting_with_buffer,
+        chatting_end_time,
+        act_obj_description,
+        act_obj_pronunciatio,
+        act_obj_event,
+        act_start_time,
+    )
+
+
+async def _wait_react(role: "STRole", reaction_mode: str):
+    scratch = role.rc.scratch
+
+    inserted_act = f'waiting to start {scratch.act_description.split("(")[-1][:-1]}'
+    end_time = datetime.datetime.strptime(reaction_mode[6:].strip(), "%B %d, %Y, %H:%M:%S")
+    inserted_act_dur = (
+        (end_time.minute + end_time.hour * 60) - (scratch.curr_time.minute + scratch.curr_time.hour * 60) + 1
+    )
+
+    act_address = f"<waiting> {scratch.curr_tile[0]} {scratch.curr_tile[1]}"
+    act_event = (role.name, "waiting to start", scratch.act_description.split("(")[-1][:-1])
+    chatting_with = None
+    chat = None
+    chatting_with_buffer = None
+    chatting_end_time = None
+
+    act_pronunciatio = "⌛"
+    act_obj_description = None
+    act_obj_pronunciatio = None
+    act_obj_event = (None, None, None)
+
+    await _create_react(
+        role,
+        inserted_act,
+        inserted_act_dur,
+        act_address,
+        act_event,
+        chatting_with,
+        chat,
+        chatting_with_buffer,
+        chatting_end_time,
+        act_pronunciatio,
+        act_obj_description,
+        act_obj_pronunciatio,
+        act_obj_event,
+    )
+
+
+async def generate_convo(init_role: "STRole", target_role: "STRole") -> Tuple[list, int]:
+    convo = await agent_conversation(init_role, target_role)
+    all_utt = ""
+
+    for row in convo:
+        speaker = row[0]
+        utt = row[1]
+        all_utt += f"{speaker}: {utt}\n"
+
+    convo_length = math.ceil(int(len(all_utt) / 8) / 30)
+
+    return convo, convo_length
+
+
+async def generate_convo_summary(conv: list[list[str]]) -> str:
+    conv_summary = await SummarizeConv().run(conv)
+    return conv_summary
+
+
+async def generate_new_decomp_schedule(
+    role: "STRole", inserted_act: str, inserted_act_dur: int, start_hour: int, end_hour: int
+):
+    # Step 1: Setting up the core variables for the function.
+    # <p> is the role whose schedule we are editing right now.
+    scratch = role.rc.scratch
+    # <today_min_pass> indicates the number of minutes that have passed today.
+    today_min_pass = int(scratch.curr_time.hour) * 60 + int(scratch.curr_time.minute) + 1
+
+    # Step 2: We need to create <main_act_dur> and <truncated_act_dur>.
+    main_act_dur = []
+    truncated_act_dur = []
+    dur_sum = 0  # duration sum
+    count = 0  # enumerate count
+    truncated_fin = False
+
+    logger.debug(f"DEBUG::: {scratch.name}")
+    for act, dur in scratch.f_daily_schedule:
+        if (dur_sum >= start_hour * 60) and (dur_sum < end_hour * 60):
+            main_act_dur += [[act, dur]]
+            if dur_sum <= today_min_pass:
+                truncated_act_dur += [[act, dur]]
+            elif dur_sum > today_min_pass and not truncated_fin:
+                # We need to insert that last act, duration list like this one:
+                # e.g., ['wakes up and completes her morning routine (wakes up...)', 2]
+                truncated_act_dur += [[scratch.f_daily_schedule[count][0], dur_sum - today_min_pass]]
+                truncated_act_dur[-1][-1] -= (
+                    dur_sum - today_min_pass
+                )  # DEC 7 DEBUG;.. is the +1 the right thing to do???
+                logger.debug(f"DEBUG::: {truncated_act_dur}")
+                truncated_fin = True
+        dur_sum += dur
+        count += 1
+
+    main_act_dur = main_act_dur
+
+    x = (
+        truncated_act_dur[-1][0].split("(")[0].strip()
+        + " (on the way to "
+        + truncated_act_dur[-1][0].split("(")[-1][:-1]
+        + ")"
+    )
+    truncated_act_dur[-1][0] = x
+
+    if "(" in truncated_act_dur[-1][0]:
+        inserted_act = truncated_act_dur[-1][0].split("(")[0].strip() + " (" + inserted_act + ")"
+
+    # To do inserted_act_dur+1 below is an important decision but I'm not sure
+    # if I understand the full extent of its implications. Might want to
+    # revisit.
+    truncated_act_dur += [[inserted_act, inserted_act_dur]]
+    start_time_hour = datetime.datetime(2022, 10, 31, 0, 0) + datetime.timedelta(hours=start_hour)
+    end_time_hour = datetime.datetime(2022, 10, 31, 0, 0) + datetime.timedelta(hours=end_hour)
+
+    return await NewDecompSchedule().run(
+        role, main_act_dur, truncated_act_dur, start_time_hour, end_time_hour, inserted_act, inserted_act_dur
+    )
+
+
+async def _long_term_planning(role: "STRole", new_day: Union[bool, str]):
+    """
+    Formulates the role's daily long-term plan if it is the start of a new
+    day. This basically has two components: first, we create the wake-up hour,
+    and second, we create the hourly schedule based on it.
+    INPUT
+        new_day: Indicates whether the current time signals a "First day",
+                 "New day", or False (for neither). This is important because we
+                 create the roles' long term planning on the new day.
+    """
+    # We start by creating the wake up hour for the role.
+    wake_up_hour = await WakeUp().run(role)
+    wake_up_hour = int(wake_up_hour)
+    logger.info(f"Role: {role.name} long_term_planning, wake_up_hour: {wake_up_hour}")
+
+    # When it is a new day, we start by creating the daily_req of the role.
+    # Note that the daily_req is a list of strings that describe the role's
+    # day in broad strokes.
+    if new_day == "First day":
+        # Bootstrapping the daily plan for the start of the generation:
+        # if this is the start of generation (i.e., there is no previous day's
+        # daily requirement), or if we are on a new day, we want to create a new
+        # set of daily requirements.
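+        # daily_req ends up as a broad-strokes list of strings, e.g.
+        # ["wake up and complete the morning routine at 7:00 am", "have breakfast at 7:30 am", ...].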
+        role.scratch.daily_req = await GenDailySchedule().run(role, wake_up_hour)
+        logger.info(f"Role: {role.name} daily requirements: {role.scratch.daily_req}")
+    elif new_day == "New day":
+        await revise_identity(role)
+
+        # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - TODO
+        # We need to create a new daily_req here...
+        role.scratch.daily_req = role.scratch.daily_req
+
+    # Based on the daily_req, we create an hourly schedule for the role,
+    # which is a list of todo items with a time duration (in minutes) that
+    # add up to 24 hours.
+    role.scratch.f_daily_schedule = await GenHourlySchedule().run(role, wake_up_hour)
+    logger.info(f"Role: {role.name} f_daily_schedule: {role.scratch.f_daily_schedule}")
+    role.scratch.f_daily_schedule_hourly_org = role.scratch.f_daily_schedule[:]
+
+    # Added March 4 -- adding plan to the memory.
+    thought = f"This is {role.scratch.name}'s plan for {role.scratch.curr_time.strftime('%A %B %d')}:"
+    for i in role.scratch.daily_req:
+        thought += f" {i},"
+    thought = thought[:-1] + "."
+    created = role.scratch.curr_time
+    expiration = role.scratch.curr_time + datetime.timedelta(days=30)
+    s, p, o = (role.scratch.name, "plan", role.scratch.curr_time.strftime("%A %B %d"))
+    keywords = set(["plan"])
+    thought_poignancy = 5
+    thought_embedding_pair = (thought, get_embedding(thought))
+    role.a_mem.add_thought(
+        created, expiration, s, p, o, thought, keywords, thought_poignancy, thought_embedding_pair, None
+    )
+
+
+async def _determine_action(role: "STRole"):
+    """
+    Creates the next action sequence for the role.
+    The main goal of this function is to run "add_new_action" on the role's
+    scratch space, which sets up all the action related variables for the next
+    action.
+    As a part of this, the role may need to decompose its hourly schedule as
+    needed.
+    INPUT
+        role: Current <"STRole"> instance whose action we are determining.
+    """
+
+    def determine_decomp(act_desp, act_dura):
+        """
+        Given an action description and its duration, we determine whether we need
+        to decompose it. If the action is about the agent sleeping, we generally
+        do not want to decompose it, so that's what we catch here.
+
+        INPUT:
+            act_desp: the description of the action (e.g., "sleeping")
+            act_dura: the duration of the action in minutes.
+        OUTPUT:
+            a boolean. True if we need to decompose, False otherwise.
+        """
+        if "sleep" not in act_desp and "bed" not in act_desp:
+            return True
+        elif "sleeping" in act_desp or "asleep" in act_desp or "in bed" in act_desp:
+            return False
+        elif "sleep" in act_desp or "bed" in act_desp:
+            if act_dura > 60:
+                return False
+        return True
+
+    # The goal of this function is to get us the action associated with
+    # <curr_index>. As a part of this, we may need to decompose some large
+    # chunk actions.
+    # Importantly, we try to decompose at least two hours worth of schedule at
+    # any given point.
+    curr_index = role.scratch.get_f_daily_schedule_index()
+    curr_index_60 = role.scratch.get_f_daily_schedule_index(advance=60)
+
+    logger.info(f"f_daily_schedule: {role.scratch.f_daily_schedule}")
+    # * Decompose *
+    # During the first hour of the day, we need to decompose a two hours
+    # sequence. We do that here.
+    if curr_index == 0:
+        # This portion is invoked if it is the first hour of the day.
+        act_desp, act_dura = role.scratch.f_daily_schedule[curr_index]
+        if act_dura >= 60:
+            # We decompose if the next action is longer than an hour, and fits the
+            # criteria described in determine_decomp.
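+            # e.g., ["sleeping", 420] is left whole, while ["working on her painting", 120]
+            # would be split into finer-grained subtasks by TaskDecomp.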
+            if determine_decomp(act_desp, act_dura):
+                role.scratch.f_daily_schedule[curr_index : curr_index + 1] = await TaskDecomp().run(
+                    role, act_desp, act_dura
+                )
+        if curr_index_60 + 1 < len(role.scratch.f_daily_schedule):
+            act_desp, act_dura = role.scratch.f_daily_schedule[curr_index_60 + 1]
+            if act_dura >= 60:
+                if determine_decomp(act_desp, act_dura):
+                    role.scratch.f_daily_schedule[curr_index_60 + 1 : curr_index_60 + 2] = await TaskDecomp().run(
+                        role, act_desp, act_dura
+                    )
+
+    if curr_index_60 < len(role.scratch.f_daily_schedule):
+        # If it is not the first hour of the day, this is always invoked (it is
+        # also invoked during the first hour of the day -- to double up so we can
+        # decompose two hours in one go). Of course, we need to have something to
+        # decompose as well, so we check for that too.
+        if role.scratch.curr_time.hour < 23:
+            # And we don't want to decompose after 11 pm.
+            act_desp, act_dura = role.scratch.f_daily_schedule[curr_index_60]
+            if act_dura >= 60:
+                if determine_decomp(act_desp, act_dura):
+                    role.scratch.f_daily_schedule[curr_index_60 : curr_index_60 + 1] = await TaskDecomp().run(
+                        role, act_desp, act_dura
+                    )
+    # * End of Decompose *
+
+    # Generate an <Action> instance from the action description and duration. By
+    # this point, we assume that all the relevant actions are decomposed and
+    # ready in f_daily_schedule.
+    logger.debug("f_daily_schedule before generating the next action:")
+    for i in role.scratch.f_daily_schedule:
+        logger.debug(i)
+    logger.debug(curr_index)
+    logger.debug(len(role.scratch.f_daily_schedule))
+    logger.debug(role.scratch.name)
+
+    # Pad the schedule with sleep so the durations add up to a full day (1440 minutes).
+    x_emergency = 0
+    for i in role.scratch.f_daily_schedule:
+        x_emergency += i[1]
+
+    if 1440 - x_emergency > 0:
+        logger.info(f"x_emergency__AAA: {x_emergency}")
+        role.scratch.f_daily_schedule += [["sleeping", 1440 - x_emergency]]
+
+    act_desp, act_dura = role.scratch.f_daily_schedule[curr_index]
+
+    new_action_details = await GenActionDetails().run(role, act_desp, act_dura)
+    # Adding the action to role's queue.
+    role.scratch.add_new_action(**new_action_details)
+
+
+async def revise_identity(role: "STRole"):
+    p_name = role.scratch.name
+
+    focal_points = [
+        f"{p_name}'s plan for {role.scratch.get_str_curr_date_str()}.",
+        f"Important recent events for {p_name}'s life.",
+    ]
+    retrieved = new_agent_retrieve(role, focal_points)
+
+    statements = "[Statements]\n"
+    for key, val in retrieved.items():
+        for i in val:
+            statements += f"{i.created.strftime('%A %B %d -- %H:%M %p')}: {i.embedding_key}\n"
+
+    plan_prompt = statements + "\n"
+    plan_prompt += f"Given the statements above, is there anything that {p_name} should remember as they plan for"
+    plan_prompt += f" *{role.scratch.curr_time.strftime('%A %B %d')}*? "
+    plan_prompt += "If there is any scheduling information, be as specific as possible (include date, time, and location if stated in the statement)\n\n"
+    plan_prompt += f"Write the response from {p_name}'s perspective."
+    plan_note = await LLM().aask(plan_prompt)
+
+    thought_prompt = statements + "\n"
+    thought_prompt += (
+        f"Given the statements above, how might we summarize {p_name}'s feelings about their days up to now?\n\n"
+    )
+    thought_prompt += f"Write the response from {p_name}'s perspective."
+    thought_note = await LLM().aask(thought_prompt)
+
+    currently_prompt = (
+        f"{p_name}'s status from {(role.scratch.curr_time - datetime.timedelta(days=1)).strftime('%A %B %d')}:\n"
+    )
+    currently_prompt += f"{role.scratch.currently}\n\n"
+    currently_prompt += f"{p_name}'s thoughts at the end of {(role.scratch.curr_time - datetime.timedelta(days=1)).strftime('%A %B %d')}:\n"
+    currently_prompt += (plan_note + thought_note).replace("\n", "") + "\n\n"
+    currently_prompt += f"It is now {role.scratch.curr_time.strftime('%A %B %d')}. Given the above, write {p_name}'s status for {role.scratch.curr_time.strftime('%A %B %d')} that reflects {p_name}'s thoughts at the end of {(role.scratch.curr_time - datetime.timedelta(days=1)).strftime('%A %B %d')}. Write this in third-person talking about {p_name}."
+    currently_prompt += "If there is any scheduling information, be as specific as possible (include date, time, and location if stated in the statement).\n\n"
+    currently_prompt += "Follow this format below:\nStatus: "
+    new_currently = await LLM().aask(currently_prompt)
+
+    role.scratch.currently = new_currently
+
+    daily_req_prompt = role.scratch.get_str_iss() + "\n"
+    daily_req_prompt += f"Today is {role.scratch.curr_time.strftime('%A %B %d')}. Here is {role.scratch.name}'s plan today in broad-strokes (with the time of the day. e.g., have a lunch at 12:00 pm, watch TV from 7 to 8 pm).\n\n"
+    daily_req_prompt += "Follow this format (the list should have 4~6 items but no more):\n"
+    daily_req_prompt += "1. wake up and complete the morning routine at