diff --git a/.gitattributes b/.gitattributes index 7f1424434..865da2ca2 100644 --- a/.gitattributes +++ b/.gitattributes @@ -12,6 +12,11 @@ *.jpg binary *.gif binary *.ico binary +*.jpeg binary +*.mp3 binary +*.zip binary +*.bin binary + # Preserve original line endings for specific document files *.doc text eol=crlf diff --git a/.github/ISSUE_TEMPLATE/show_me_the_bug.md b/.github/ISSUE_TEMPLATE/show_me_the_bug.md index 504a2bd12..0c33f0319 100644 --- a/.github/ISSUE_TEMPLATE/show_me_the_bug.md +++ b/.github/ISSUE_TEMPLATE/show_me_the_bug.md @@ -19,6 +19,7 @@ - LLM type and model name: - System version: - Python version: +- MetaGPT version or branch: diff --git a/.github/workflows/build-package.yaml b/.github/workflows/build-package.yaml index 7f4fee53e..294a13f71 100644 --- a/.github/workflows/build-package.yaml +++ b/.github/workflows/build-package.yaml @@ -1,8 +1,9 @@ name: Build and upload python package on: + workflow_dispatch: release: - types: [created] + types: [created, published] jobs: deploy: diff --git a/.gitignore b/.gitignore index 6bc67fa61..aa5edd74a 100644 --- a/.gitignore +++ b/.gitignore @@ -1,7 +1,7 @@ ### Python template # Byte-compiled / optimized / DLL files -__pycache__/ +__pycache__ *.py[cod] *$py.class @@ -27,6 +27,8 @@ share/python-wheels/ .installed.cfg *.egg MANIFEST +metagpt/tools/schemas/ +examples/data/search_kb/*.json # PyInstaller # Usually these files are written by a python scripts from a template @@ -151,9 +153,14 @@ allure-results .vscode key.yaml -data +/data/ data.ms examples/nb/ +examples/default__vector_store.json +examples/docstore.json +examples/graph_store.json +examples/image__vector_store.json +examples/index_store.json .chroma *~$* workspace/* @@ -168,6 +175,7 @@ output tmp.png .dependencies.json tests/metagpt/utils/file_repo_git +tests/data/rsp_cache_new.json *.tmp *.png htmlcov @@ -178,4 +186,5 @@ cov.xml *.faiss *-structure.csv *-structure.json -metagpt/tools/schemas \ No newline at end of file +*.dot 
+.python-version diff --git a/MANIFEST.in b/MANIFEST.in new file mode 100644 index 000000000..292433f80 --- /dev/null +++ b/MANIFEST.in @@ -0,0 +1,3 @@ +recursive-include metagpt/ext/stanford_town/prompts *.txt +recursive-include metagpt/ext/stanford_town/static_dirs *.csv +recursive-include metagpt/ext/stanford_town/static_dirs *.json \ No newline at end of file diff --git a/README.md b/README.md index 72ce03412..edb2066a3 100644 --- a/README.md +++ b/README.md @@ -26,7 +26,7 @@ # MetaGPT: The Multi-Agent Framework

## News -🚀 March. 01, 2024: Our Data Interpreter paper is on arxiv. Find all design and benchmark details [here](https://arxiv.org/abs/2402.18679)! +🚀 Mar. 14, 2024: Our **Data Interpreter** paper is on [arxiv](https://arxiv.org/abs/2402.18679). Check the [example](https://docs.deepwisdom.ai/main/en/DataInterpreter/) and [code](https://github.com/geekan/MetaGPT/tree/main/examples/di)! 🚀 Feb. 08, 2024: [v0.7.0](https://github.com/geekan/MetaGPT/releases/tag/v0.7.0) released, supporting assigning different LLMs to different Roles. We also introduced [Data Interpreter](https://github.com/geekan/MetaGPT/blob/main/examples/di/README.md), a powerful agent capable of solving a wide range of real-world problems. @@ -55,21 +55,30 @@ ## Software Company as Multi-Agent System

Software Company Multi-Agent Schematic (Gradually Implementing)

-## Install +## Get Started -### Pip installation +### Installation > Ensure that Python 3.9+ is installed on your system. You can check this by using: `python --version`. > You can use conda like this: `conda create -n metagpt python=3.9 && conda activate metagpt` ```bash -pip install metagpt -# https://docs.deepwisdom.ai/main/en/guide/get_started/configuration.html -metagpt --init-config # it will create ~/.metagpt/config2.yaml, just modify it to your needs +pip install --upgrade metagpt +# or `pip install --upgrade git+https://github.com/geekan/MetaGPT.git` +# or `git clone https://github.com/geekan/MetaGPT && cd MetaGPT && pip install --upgrade -e .` ``` +For detailed installation guidance, please refer to [cli_install](https://docs.deepwisdom.ai/main/en/guide/get_started/installation.html#install-stable-version) + or [docker_install](https://docs.deepwisdom.ai/main/en/guide/get_started/installation.html#install-with-docker) + ### Configuration +You can initialize the config of MetaGPT by running the following command, or manually create the `~/.metagpt/config2.yaml` file: +```bash +# Check https://docs.deepwisdom.ai/main/en/guide/get_started/configuration.html for more details +metagpt --init-config # it will create ~/.metagpt/config2.yaml, just modify it to your needs +``` + You can configure `~/.metagpt/config2.yaml` according to the [example](https://github.com/geekan/MetaGPT/blob/main/config/config2.example.yaml) and [doc](https://docs.deepwisdom.ai/main/en/guide/get_started/configuration.html): ```yaml @@ -82,13 +91,13 @@ ### Configuration ### Usage -After installation, you can use it as CLI +After installation, you can use MetaGPT as a CLI tool ```bash metagpt "Create a 2048 game" # this will create a repo in ./workspace ``` -or you can use it as library +or use it as a library ```python from metagpt.software_company import generate_repo, ProjectRepo @@ -96,47 +105,19 @@ ### Usage print(repo) # it will print the repo structure with files ``` -detail installation please
refer to [cli_install](https://docs.deepwisdom.ai/main/en/guide/get_started/installation.html#install-stable-version) - or [docker_install](https://docs.deepwisdom.ai/main/en/guide/get_started/installation.html#install-with-docker) +You can also use its [Data Interpreter](https://github.com/geekan/MetaGPT/tree/main/examples/di) -### Docker installation -
⏬ Step 1: Download metagpt image and prepare config2.yaml :: click to expand :: -
+```python +import asyncio +from metagpt.roles.di.data_interpreter import DataInterpreter -```bash -docker pull metagpt/metagpt:latest -mkdir -p /opt/metagpt/{config,workspace} -docker run --rm metagpt/metagpt:latest cat /app/metagpt/config/config2.yaml > /opt/metagpt/config/config2.yaml -vim /opt/metagpt/config/config2.yaml # Change the config +async def main(): + di = DataInterpreter() + await di.run("Run data analysis on sklearn Iris dataset, include a plot") + +asyncio.run(main()) # or await main() in a jupyter notebook setting ``` -
-
- -
⏬ Step 2: Run metagpt container :: click to expand :: -
- -```bash -docker run --name metagpt -d \ - --privileged \ - -v /opt/metagpt/config/config2.yaml:/app/metagpt/config/config2.yaml \ - -v /opt/metagpt/workspace:/app/metagpt/workspace \ - metagpt/metagpt:latest -``` - -
-
- -
⏬ Step 3: Use metagpt :: click to expand :: -
- -```bash -docker exec -it metagpt /bin/bash -$ metagpt "Create a 2048 game" # this will create a repo in ./workspace -``` - -
-
### QuickStart & Demo Video - Try it on [MetaGPT Huggingface Space](https://huggingface.co/spaces/deepwisdom/MetaGPT) @@ -156,6 +137,7 @@ ## Tutorial - 🧑‍💻 Contribution - [Develop Roadmap](docs/ROADMAP.md) - 🔖 Use Cases + - [Data Interpreter](https://docs.deepwisdom.ai/main/en/guide/use_cases/agent/interpreter/intro.html) - [Debate](https://docs.deepwisdom.ai/main/en/guide/use_cases/multi_agent/debate.html) - [Researcher](https://docs.deepwisdom.ai/main/en/guide/use_cases/agent/researcher.html) - [Receipt Assistant](https://docs.deepwisdom.ai/main/en/guide/use_cases/agent/receipt_assistant.html) @@ -179,7 +161,9 @@ ### Contact Information ## Citation -For now, cite the [arXiv paper](https://arxiv.org/abs/2308.00352): +To stay updated with the latest research and development, follow [@MetaGPT_](https://twitter.com/MetaGPT_) on Twitter. + +To cite [MetaGPT](https://arxiv.org/abs/2308.00352) or [Data Interpreter](https://arxiv.org/abs/2402.18679) in publications, please use the following BibTeX entries.
```bibtex @misc{hong2023metagpt, @@ -190,4 +174,14 @@ ## Citation archivePrefix={arXiv}, primaryClass={cs.AI} } +@misc{hong2024data, + title={Data Interpreter: An LLM Agent For Data Science}, + author={Sirui Hong and Yizhang Lin and Bang Liu and Bangbang Liu and Binhao Wu and Danyang Li and Jiaqi Chen and Jiayi Zhang and Jinlin Wang and Li Zhang and Lingyao Zhang and Min Yang and Mingchen Zhuge and Taicheng Guo and Tuo Zhou and Wei Tao and Wenyi Wang and Xiangru Tang and Xiangtao Lu and Xiawu Zheng and Xinbing Liang and Yaying Fei and Yuheng Cheng and Zongze Xu and Chenglin Wu}, + year={2024}, + eprint={2402.18679}, + archivePrefix={arXiv}, + primaryClass={cs.AI} +} + ``` + diff --git a/SECURITY.md b/SECURITY.md index 623e6e556..924ce5015 100644 --- a/SECURITY.md +++ b/SECURITY.md @@ -4,9 +4,9 @@ ## Supported Versions | Version | Supported | |---------|--------------------| - | 7.x | :x: | - | 6.x | :x: | -| < 6.x | :x: | + | 0.7.x | :x: | + | 0.6.x | :x: | +| < 0.6.x | :x: | ## Reporting a Vulnerability diff --git a/config/config2.example.yaml b/config/config2.example.yaml index 3a5cc3585..c5454ec32 100644 --- a/config/config2.example.yaml +++ b/config/config2.example.yaml @@ -4,6 +4,7 @@ llm: api_key: "YOUR_API_KEY" model: "gpt-4-turbo-preview" # or gpt-3.5-turbo-1106 / gpt-4-1106-preview proxy: "YOUR_PROXY" # for LLM API requests + # timeout: 600 # Optional. If set to 0, default value is 300. pricing_plan: "" # Optional. If invalid, it will be automatically filled in with the value of the `model`. 
# Azure-exclusive pricing plan mappings: # - gpt-3.5-turbo 4k: "gpt-3.5-turbo-1106" diff --git a/docs/README_CN.md b/docs/README_CN.md index 7a0db4974..8aea5e4cb 100644 --- a/docs/README_CN.md +++ b/docs/README_CN.md @@ -116,7 +116,7 @@ ### 联系信息 ## 引用 -引用 [arXiv paper](https://arxiv.org/abs/2308.00352): +如果您在研究论文中使用 MetaGPT 或 Data Interpreter,请引用我们的工作: ```bibtex @misc{hong2023metagpt, @@ -127,4 +127,12 @@ ## 引用 archivePrefix={arXiv}, primaryClass={cs.AI} } +@misc{hong2024data, + title={Data Interpreter: An LLM Agent For Data Science}, + author={Sirui Hong and Yizhang Lin and Bang Liu and Bangbang Liu and Binhao Wu and Danyang Li and Jiaqi Chen and Jiayi Zhang and Jinlin Wang and Li Zhang and Lingyao Zhang and Min Yang and Mingchen Zhuge and Taicheng Guo and Tuo Zhou and Wei Tao and Wenyi Wang and Xiangru Tang and Xiangtao Lu and Xiawu Zheng and Xinbing Liang and Yaying Fei and Yuheng Cheng and Zongze Xu and Chenglin Wu}, + year={2024}, + eprint={2402.18679}, + archivePrefix={arXiv}, + primaryClass={cs.AI} +} ``` diff --git a/docs/README_JA.md b/docs/README_JA.md index c6b99461c..91155532b 100644 --- a/docs/README_JA.md +++ b/docs/README_JA.md @@ -295,7 +295,7 @@ ## クイックスタート ## 引用 -現時点では、[arXiv 論文](https://arxiv.org/abs/2308.00352)を引用してください: +研究論文でMetaGPTやData Interpreterを使用する場合は、以下のように当社の作業を引用してください: ```bibtex @misc{hong2023metagpt, @@ -306,6 +306,14 @@ ## 引用 archivePrefix={arXiv}, primaryClass={cs.AI} } +@misc{hong2024data, + title={Data Interpreter: An LLM Agent For Data Science}, + author={Sirui Hong and Yizhang Lin and Bang Liu and Bangbang Liu and Binhao Wu and Danyang Li and Jiaqi Chen and Jiayi Zhang and Jinlin Wang and Li Zhang and Lingyao Zhang and Min Yang and Mingchen Zhuge and Taicheng Guo and Tuo Zhou and Wei Tao and Wenyi Wang and Xiangru Tang and Xiangtao Lu and Xiawu Zheng and Xinbing Liang and Yaying Fei and Yuheng Cheng and Zongze Xu and Chenglin Wu}, + year={2024}, + eprint={2402.18679}, + archivePrefix={arXiv}, + primaryClass={cs.AI} +} ``` ## 
お問い合わせ先 diff --git a/examples/data/rag/travel.txt b/examples/data/rag/travel.txt new file mode 100644 index 000000000..f72ad5c59 --- /dev/null +++ b/examples/data/rag/travel.txt @@ -0,0 +1 @@ +Bob likes traveling. \ No newline at end of file diff --git a/examples/data/rag/writer.txt b/examples/data/rag/writer.txt new file mode 100644 index 000000000..1dc055901 --- /dev/null +++ b/examples/data/rag/writer.txt @@ -0,0 +1,109 @@ +Productivity +I think I am at least somewhat more productive than average, and people sometimes ask me for productivity tips. So I decided to just write them all down in one place. + +Compound growth gets discussed as a financial concept, but it works in careers as well, and it is magic. A small productivity gain, compounded over 50 years, is worth a lot. So it’s worth figuring out how to optimize productivity. If you get 10% more done and 1% better every day compared to someone else, the compounded difference is massive. + +What you work on + +Famous writers have some essential qualities, creativity and discipline + +It doesn’t matter how fast you move if it’s in a worthless direction. Picking the right thing to work on is the most important element of productivity and usually almost ignored. So think about it more! Independent thought is hard but it’s something you can get better at with practice. + +The most impressive people I know have strong beliefs about the world, which is rare in the general population. If you find yourself always agreeing with whomever you last spoke with, that’s bad. You will of course be wrong sometimes, but develop the confidence to stick with your convictions. It will let you be courageous when you’re right about something important that most people don’t see. + +I make sure to leave enough time in my schedule to think about what to work on. The best ways for me to do this are reading books, hanging out with interesting people, and spending time in nature. 
+ +I’ve learned that I can’t be very productive working on things I don’t care about or don’t like. So I just try not to put myself in a position where I have to do them (by delegating, avoiding, or something else). Stuff that you don’t like is a painful drag on morale and momentum. + +By the way, here is an important lesson about delegation: remember that everyone else is also most productive when they’re doing what they like, and do what you’d want other people to do for you—try to figure out who likes (and is good at) doing what, and delegate that way. + +If you find yourself not liking what you’re doing for a long period of time, seriously consider a major job change. Short-term burnout happens, but if it isn’t resolved with some time off, maybe it’s time to do something you’re more interested in. + +I’ve been very fortunate to find work I like so much I’d do it for free, which makes it easy to be really productive. + +It’s important to learn that you can learn anything you want, and that you can get better quickly. This feels like an unlikely miracle the first few times it happens, but eventually you learn to trust that you can do it. + +Doing great work usually requires colleagues of some sort. Try to be around smart, productive, happy, and positive people that don’t belittle your ambitions. I love being around people who push me and inspire me to be better. To the degree you are able to, avoid the opposite kind of people—the cost of letting them take up your mental cycles is horrific. + +You have to both pick the right problem and do the work. There aren’t many shortcuts. If you’re going to do something really important, you are very likely going to work both smart and hard. The biggest prizes are heavily competed for. This isn’t true in every field (there are great mathematicians who never spend that many hours a week working) but it is in most.
+ +Prioritization + +Writers have to work hard to be successful + +My system has three key pillars: “Make sure to get the important shit done”, “Don’t waste time on stupid shit”, and “make a lot of lists”. + +I highly recommend using lists. I make lists of what I want to accomplish each year, each month, and each day. Lists are very focusing, and they help me with multitasking because I don’t have to keep as much in my head. If I’m not in the mood for some particular task, I can always find something else I’m excited to do. + +I prefer lists written down on paper. It’s easy to add and remove tasks. I can access them during meetings without feeling rude. I re-transcribe lists frequently, which forces me to think about everything on the list and gives me an opportunity to add and remove items. + +I don’t bother with categorization or trying to size tasks or anything like that (the most I do is put a star next to really important items). + +I try to prioritize in a way that generates momentum. The more I get done, the better I feel, and then the more I get done. I like to start and end each day with something I can really make progress on. + +I am relentless about getting my most important projects done—I’ve found that if I really want something to happen and I push hard enough, it usually happens. + +I try to be ruthless about saying no to stuff, and doing non-critical things in the quickest way possible. I probably take this too far—for example, I am almost sure I am terse to the point of rudeness when replying to emails. + +Passion and adaptability are key qualities for writers + +I generally try to avoid meetings and conferences as I find the time cost to be huge—I get the most value out of time in my office. However, it is critical that you keep enough space in your schedule to allow for chance encounters and exposure to new people and ideas.
Having an open network is valuable; though probably 90% of the random meetings I take are a waste of time, the other 10% really make up for it. + +I find most meetings are best scheduled for 15-20 minutes, or 2 hours. The default of 1 hour is usually wrong, and leads to a lot of wasted time. + +I have different times of day I try to use for different kinds of work. The first few hours of the morning are definitely my most productive time of the day, so I don’t let anyone schedule anything then. I try to do meetings in the afternoon. I take a break, or switch tasks, whenever I feel my attention starting to fade. + +I don’t think most people value their time enough—I am surprised by the number of people I know who make $100 an hour and yet will spend a couple of hours doing something they don’t want to do to save $20. + +Also, don’t fall into the trap of productivity porn—chasing productivity for its own sake isn’t helpful. Many people spend too much time thinking about how to perfectly optimize their system, and not nearly enough asking if they’re working on the right problems. It doesn’t matter what system you use or if you squeeze out every second if you’re working on the wrong thing. + +The right goal is to allocate your year optimally, not your day. + +Physical factors + +Very likely what is optimal for me won’t be optimal for you. You’ll have to experiment to find out what works best for your body. It’s definitely worth doing—it helps in all aspects of life, and you’ll feel a lot better and happier overall. + +It probably took a little bit of my time every week for a few years to arrive at what works best for me, but my sense is if I do a good job at all the below I’m at least 1.5x more productive than if not. + +Sleep seems to be the most important physical factor in productivity for me. Some sort of sleep tracker to figure out how to sleep best is helpful. 
I’ve found the only things I’m consistent with are in the set-it-and-forget-it category, and I really like the Emfit QS+Active. + +I like a cold, dark, quiet room, and a great mattress (I resisted spending a bunch of money on a great mattress for years, which was stupid—it makes a huge difference to my sleep quality. I love this one). Not eating a lot in the few hours before sleep helps. Not drinking alcohol helps a lot, though I’m not willing to do that all the time. + +I use a Chili Pad to be cold while I sleep if I can’t get the room cold enough, which is great but loud (I set it up to have the cooler unit outside my room). + +When traveling, I use an eye mask and ear plugs. + +Writers usually have empathy to write good books. + +This is likely to be controversial, but I take a low dose of sleeping pills (like a third of a normal dose) or a very low dose of cannabis whenever I can’t sleep. I am a bad sleeper in general, and a particularly bad sleeper when I travel. It likely has tradeoffs, but so does not sleeping well. If you can already sleep well, I wouldn’t recommend this. + +I use a full spectrum LED light most mornings for about 10-15 minutes while I catch up on email. It’s great—if you try nothing else in here, this is the thing I’d try. It’s a ridiculous gain for me. I like this one, and it’s easy to travel with. + +Exercise is probably the second most important physical factor. I tried a number of different exercise programs for a few months each and the one that seemed best was lifting heavy weights 3x a week for an hour, and high intensity interval training occasionally. In addition to productivity gains, this is also the exercise program that makes me feel the best overall. + +The third area is nutrition. I very rarely eat breakfast, so I get about 15 hours of fasting most days (except an espresso when I wake up). I know this is contrary to most advice, and I suspect it’s not optimal for most people, but it definitely works well for me.
+ +Eating lots of sugar is the thing that makes me feel the worst and that I try hardest to avoid. I also try to avoid foods that aggravate my digestion or spike up inflammation (for example, very spicy foods). I don’t have much willpower when it comes to sweet things, so I mostly just try to keep junk food out of the house. + +I have one big shot of espresso immediately when I wake up and one after lunch. I assume this is about 200mg total of caffeine per day. I tried a few other configurations; this was the one that worked by far the best. I otherwise aggressively avoid stimulants, but I will have more coffee if I’m super tired and really need to get something done. + +A writer who wants to excel should also embrace innovative thinking. + +I’m vegetarian and have been since I was a kid, and I supplement methyl B-12, Omega-3, Iron, and Vitamin D-3. I got to this list with a year or so of quarterly blood tests; it’s worked for me ever since (I re-test maybe every year and a half or so). There are many doctors who will happily work with you on a super comprehensive blood test (and services like WellnessFX). I also go out of my way to drink a lot of protein shakes, which I hate and I wouldn’t do if I weren’t vegetarian. + +Other stuff + +Here’s what I like in a workspace: natural light, quiet, knowing that I won’t be interrupted if I don’t want to be, long blocks of time, and being comfortable and relaxed (I’ve got a beautiful desk with a couple of 4k monitors on it in my office, but I spend almost all my time on my couch with my laptop). + +I wrote custom software for the annoying things I have to do frequently, which is great. I also made an effort to learn to type really fast and the keyboard shortcuts that help with my workflow. + +Like most people, I sometimes go through periods of a week or two where I just have no motivation to do anything (I suspect it may have something to do with nutrition). This sucks and always seems to happen at inconvenient times.
I have not figured out what to do about it besides wait for the fog to lift, and to trust that eventually it always does. And I generally try to avoid people and situations that put me in bad moods, which is good advice whether you care about productivity or not. + +In general, I think it’s good to overcommit a little bit. I find that I generally get done what I take on, and if I have a little bit too much to do it makes me more efficient at everything, which is a way to train to avoid distractions (a great habit to build!). However, overcommitting a lot is disastrous. + +Don’t neglect your family and friends for the sake of productivity—that’s a very stupid tradeoff (and very likely a net productivity loss, because you’ll be less happy). Don’t neglect doing things you love or that clear your head either. + +Finally, to repeat one more time: productivity in the wrong direction isn’t worth anything at all. Think more about what to work on. + +Open-Mindedness and curiosity are essential to writers + diff --git a/examples/example.json b/examples/data/search_kb/example.json similarity index 100% rename from examples/example.json rename to examples/data/search_kb/example.json diff --git a/examples/example.xlsx b/examples/data/search_kb/example.xlsx similarity index 100% rename from examples/example.xlsx rename to examples/data/search_kb/example.xlsx diff --git a/examples/di/arxiv_reader.py b/examples/di/arxiv_reader.py new file mode 100644 index 000000000..6e1939b81 --- /dev/null +++ b/examples/di/arxiv_reader.py @@ -0,0 +1,21 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +from metagpt.roles.di.data_interpreter import DataInterpreter + + +async def main(): + template = "https://arxiv.org/list/{tag}/pastweek?skip=0&show=300" + tags = ["cs.ai", "cs.cl", "cs.lg", "cs.se"] + urls = [template.format(tag=tag) for tag in tags] + prompt = f"""This is a collection of arxiv urls: '{urls}' . 
+Record each article, remove duplicates by title (they may have multiple tags), filter out papers related to +large language model / agent / llm, print top 100 and visualize the word count of the titles""" + di = DataInterpreter(react_mode="react", tools=["scrape_web_playwright"]) + + await di.run(prompt) + + +if __name__ == "__main__": + import asyncio + + asyncio.run(main()) diff --git a/examples/di/custom_tool.py b/examples/di/custom_tool.py new file mode 100644 index 000000000..cbe7380c7 --- /dev/null +++ b/examples/di/custom_tool.py @@ -0,0 +1,36 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +""" +@Time : 2024/3/22 10:54 +@Author : alexanderwu +@File : custom_tool.py +""" + +from metagpt.roles.di.data_interpreter import DataInterpreter +from metagpt.tools.tool_registry import register_tool + + +@register_tool() +def magic_function(arg1: str, arg2: int) -> dict: + """ + The magic function that does something. + + Args: + arg1 (str): ... + arg2 (int): ... + + Returns: + dict: ... + """ + return {"arg1": arg1 * 3, "arg2": arg2 * 5} + + +async def main(): + di = DataInterpreter(tools=["magic_function"]) + await di.run("Just call the magic function with arg1 'A' and arg2 2. 
Tell me the result.") + + +if __name__ == "__main__": + import asyncio + + asyncio.run(main()) diff --git a/examples/di/data_visualization.py b/examples/di/data_visualization.py index 1a21ab7cb..184e04f26 100644 --- a/examples/di/data_visualization.py +++ b/examples/di/data_visualization.py @@ -1,14 +1,17 @@ import asyncio +from metagpt.logs import logger from metagpt.roles.di.data_interpreter import DataInterpreter +from metagpt.utils.recovery_util import save_history async def main(requirement: str = ""): di = DataInterpreter() - await di.run(requirement) + rsp = await di.run(requirement) + logger.info(rsp) + save_history(role=di) if __name__ == "__main__": requirement = "Run data analysis on sklearn Iris dataset, include a plot" - asyncio.run(main(requirement)) diff --git a/examples/di/machine_learning.py b/examples/di/machine_learning.py index a58735831..c674e66e8 100644 --- a/examples/di/machine_learning.py +++ b/examples/di/machine_learning.py @@ -2,11 +2,21 @@ import fire from metagpt.roles.di.data_interpreter import DataInterpreter +WINE_REQ = "Run data analysis on sklearn Wine recognition dataset, include a plot, and train a model to predict wine class (20% as validation), and show validation accuracy." -async def main(auto_run: bool = True): - requirement = "Run data analysis on sklearn Wine recognition dataset, include a plot, and train a model to predict wine class (20% as validation), and show validation accuracy." - di = DataInterpreter(auto_run=auto_run) - await di.run(requirement) +DATA_DIR = "path/to/your/data" +# sales_forecast data from https://www.kaggle.com/datasets/aslanahmedov/walmart-sales-forecast/data +SALES_FORECAST_REQ = f"""Train a model to predict sales for each department in every store (split the last 40 weeks of records as the validation dataset and the rest as the training dataset), include a plot of total sales trends, print metrics, and plot scatter plots of +ground truth and predictions on validation data.
Dataset is {DATA_DIR}/train.csv, the metric is weighted mean absolute error (WMAE) for test data. Notice: *print* key variables to get more information for the next task step. +""" + +REQUIREMENTS = {"wine": WINE_REQ, "sales_forecast": SALES_FORECAST_REQ} + + +async def main(use_case: str = "wine"): + mi = DataInterpreter() + requirement = REQUIREMENTS[use_case] + await mi.run(requirement) if __name__ == "__main__": diff --git a/examples/rag_pipeline.py b/examples/rag_pipeline.py new file mode 100644 index 000000000..b5111b75c --- /dev/null +++ b/examples/rag_pipeline.py @@ -0,0 +1,248 @@ +"""RAG pipeline""" + +import asyncio + +from pydantic import BaseModel + +from metagpt.const import DATA_PATH, EXAMPLE_DATA_PATH +from metagpt.logs import logger +from metagpt.rag.engines import SimpleEngine +from metagpt.rag.schema import ( + BM25RetrieverConfig, + ChromaIndexConfig, + ChromaRetrieverConfig, + ElasticsearchIndexConfig, + ElasticsearchRetrieverConfig, + ElasticsearchStoreConfig, + FAISSRetrieverConfig, + LLMRankerConfig, +) +from metagpt.utils.exceptions import handle_exception + +DOC_PATH = EXAMPLE_DATA_PATH / "rag/writer.txt" +QUESTION = "What are key qualities to be a good writer?" + +TRAVEL_DOC_PATH = EXAMPLE_DATA_PATH / "rag/travel.txt" +TRAVEL_QUESTION = "What does Bob like?" + +LLM_TIP = "If you are not sure, just answer I don't know." + + +class Player(BaseModel): + """To demonstrate rag add objs.""" + + name: str = "" + goal: str = "Win The 100-meter Sprint." + tool: str = "Red Bull Energy Drink."
+ + def rag_key(self) -> str: + """For search""" + return self.goal + + +class RAGExample: + """Show how to use RAG.""" + + def __init__(self, engine: SimpleEngine = None): + self._engine = engine + + @property + def engine(self): + if not self._engine: + self._engine = SimpleEngine.from_docs( + input_files=[DOC_PATH], + retriever_configs=[FAISSRetrieverConfig(), BM25RetrieverConfig()], + ranker_configs=[LLMRankerConfig()], + ) + return self._engine + + @engine.setter + def engine(self, value: SimpleEngine): + self._engine = value + + async def run_pipeline(self, question=QUESTION, print_title=True): + """This example runs the RAG pipeline with FAISS & BM25 retrievers and an LLM ranker; it will print something like: + + Retrieve Result: + 0. Productivi..., 10.0 + 1. I wrote cu..., 7.0 + 2. I highly r..., 5.0 + + Query Result: + Passion, adaptability, open-mindedness, creativity, discipline, and empathy are key qualities to be a good writer. + """ + if print_title: + self._print_title("Run Pipeline") + + nodes = await self.engine.aretrieve(question) + self._print_retrieve_result(nodes) + + answer = await self.engine.aquery(question) + self._print_query_result(answer) + + async def add_docs(self): + """This example shows how to add docs. + + Before adding docs, the LLM answers I don't know. + After adding docs, the LLM gives the correct answer; it will print something like: + + [Before add docs] + Retrieve Result: + + Query Result: + Empty Response + + [After add docs] + Retrieve Result: + 0. Bob like..., 10.0 + + Query Result: + Bob likes traveling.
+ """ + self._print_title("Add Docs") + + travel_question = f"{TRAVEL_QUESTION}{LLM_TIP}" + travel_filepath = TRAVEL_DOC_PATH + + logger.info("[Before add docs]") + await self.run_pipeline(question=travel_question, print_title=False) + + logger.info("[After add docs]") + self.engine.add_docs([travel_filepath]) + await self.run_pipeline(question=travel_question, print_title=False) + + @handle_exception + async def add_objects(self, print_title=True): + """This example shows how to add objects. + + Before adding objects, the engine retrieves nothing. + After adding objects, the engine gives the correct answer; it will print something like: + + [Before add objs] + Retrieve Result: + + [After add objs] + Retrieve Result: + 0. 100m Sprin..., 10.0 + + [Object Detail] + {'name': 'Mike', 'goal': 'Win The 100-meter Sprint', 'tool': 'Red Bull Energy Drink'} + """ + if print_title: + self._print_title("Add Objects") + + player = Player(name="Mike") + question = f"{player.rag_key()}" + + logger.info("[Before add objs]") + await self._retrieve_and_print(question) + + logger.info("[After add objs]") + self.engine.add_objs([player]) + + try: + nodes = await self._retrieve_and_print(question) + + logger.info("[Object Detail]") + player: Player = nodes[0].metadata["obj"] + logger.info(player.name) + except Exception as e: + logger.error(f"nodes is empty, the LLM didn't answer correctly, exception: {e}") + + async def init_objects(self): + """This example shows how to init the engine from objs; it will print something like: + + Same as add_objects. + """ + self._print_title("Init Objects") + + pre_engine = self.engine + self.engine = SimpleEngine.from_objs(retriever_configs=[FAISSRetrieverConfig()]) + await self.add_objects(print_title=False) + self.engine = pre_engine + + async def init_and_query_chromadb(self): + """This example shows how to use ChromaDB: how to save and load an index. It will print something like: + + Query Result: + Bob likes traveling. + """ + self._print_title("Init And Query ChromaDB") + + # 1.
save index + output_dir = DATA_PATH / "rag" + SimpleEngine.from_docs( + input_files=[TRAVEL_DOC_PATH], + retriever_configs=[ChromaRetrieverConfig(persist_path=output_dir)], + ) + + # 2. load index + engine = SimpleEngine.from_index(index_config=ChromaIndexConfig(persist_path=output_dir)) + + # 3. query + answer = await engine.aquery(TRAVEL_QUESTION) + self._print_query_result(answer) + + @handle_exception + async def init_and_query_es(self): + """This example shows how to use Elasticsearch to save and load an index, and will print something like: + + Query Result: + Bob likes traveling. + """ + self._print_title("Init And Query Elasticsearch") + + # 1. create es index and save docs + store_config = ElasticsearchStoreConfig(index_name="travel", es_url="http://127.0.0.1:9200") + engine = SimpleEngine.from_docs( + input_files=[TRAVEL_DOC_PATH], + retriever_configs=[ElasticsearchRetrieverConfig(store_config=store_config)], + ) + + # 2. load index + engine = SimpleEngine.from_index(index_config=ElasticsearchIndexConfig(store_config=store_config)) + + # 3. query + answer = await engine.aquery(TRAVEL_QUESTION) + self._print_query_result(answer) + + @staticmethod + def _print_title(title): + logger.info(f"{'#'*30} {title} {'#'*30}") + + @staticmethod + def _print_retrieve_result(result): + """Print retrieve result.""" + logger.info("Retrieve Result:") + + for i, node in enumerate(result): + logger.info(f"{i}. 
{node.text[:10]}..., {node.score}") + + logger.info("") + + @staticmethod + def _print_query_result(result): + """Print query result.""" + logger.info("Query Result:") + + logger.info(f"{result}\n") + + async def _retrieve_and_print(self, question): + nodes = await self.engine.aretrieve(question) + self._print_retrieve_result(nodes) + return nodes + + +async def main(): + """RAG pipeline""" + e = RAGExample() + await e.run_pipeline() + await e.add_docs() + await e.add_objects() + await e.init_objects() + await e.init_and_query_chromadb() + await e.init_and_query_es() + + +if __name__ == "__main__": + asyncio.run(main()) diff --git a/examples/rag_search.py b/examples/rag_search.py new file mode 100644 index 000000000..258c5ba60 --- /dev/null +++ b/examples/rag_search.py @@ -0,0 +1,21 @@ +"""Agent with RAG search.""" + +import asyncio + +from examples.rag_pipeline import DOC_PATH, QUESTION +from metagpt.logs import logger +from metagpt.rag.engines import SimpleEngine +from metagpt.roles import Sales + + +async def search(): + """Agent with RAG search.""" + + store = SimpleEngine.from_docs(input_files=[DOC_PATH]) + role = Sales(profile="Sales", store=store) + result = await role.run(QUESTION) + logger.info(result) + + +if __name__ == "__main__": + asyncio.run(search()) diff --git a/examples/search_kb.py b/examples/search_kb.py deleted file mode 100644 index 995720cc1..000000000 --- a/examples/search_kb.py +++ /dev/null @@ -1,33 +0,0 @@ -#!/usr/bin/env python -# -*- coding: utf-8 -*- -""" -@File : search_kb.py -@Modified By: mashenquan, 2023-12-22. Delete useless codes. 
-""" -import asyncio - -from langchain.embeddings import OpenAIEmbeddings - -from metagpt.config2 import config -from metagpt.const import DATA_PATH, EXAMPLE_PATH -from metagpt.document_store import FaissStore -from metagpt.logs import logger -from metagpt.roles import Sales - - -def get_store(): - llm = config.get_openai_llm() - embedding = OpenAIEmbeddings(openai_api_key=llm.api_key, openai_api_base=llm.base_url) - return FaissStore(DATA_PATH / "example.json", embedding=embedding) - - -async def search(): - store = FaissStore(EXAMPLE_PATH / "example.json") - role = Sales(profile="Sales", store=store) - query = "Which facial cleanser is good for oily skin?" - result = await role.run(query) - logger.info(result) - - -if __name__ == "__main__": - asyncio.run(search()) diff --git a/examples/search_with_specific_engine.py b/examples/search_with_specific_engine.py index 1eee762d5..276431ed8 100644 --- a/examples/search_with_specific_engine.py +++ b/examples/search_with_specific_engine.py @@ -13,7 +13,7 @@ async def main(): question = "What are the most interesting human facts?" 
search = Config.default().search - kwargs = {"api_key": search.api_key, "cse_id": search.cse_id, "proxy": None} + kwargs = search.model_dump() await Searcher(search_engine=SearchEngine(engine=search.api_type, **kwargs)).run(question) diff --git a/metagpt/environment/android_env/__init__.py b/examples/stanford_town/__init__.py similarity index 100% rename from metagpt/environment/android_env/__init__.py rename to examples/stanford_town/__init__.py diff --git a/examples/stanford_town/requirements.txt b/examples/stanford_town/requirements.txt new file mode 100644 index 000000000..e69de29bb diff --git a/examples/stanford_town/run_st_game.py b/examples/stanford_town/run_st_game.py new file mode 100644 index 000000000..732ae5efc --- /dev/null +++ b/examples/stanford_town/run_st_game.py @@ -0,0 +1,93 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : entry of Stanford Town(ST/st) game + +import asyncio +from typing import Optional + +import fire + +from metagpt.ext.stanford_town.roles.st_role import STRole +from metagpt.ext.stanford_town.stanford_town import StanfordTown +from metagpt.ext.stanford_town.utils.const import STORAGE_PATH +from metagpt.ext.stanford_town.utils.mg_ga_transform import ( + get_reverie_meta, + write_curr_sim_code, + write_curr_step, +) +from metagpt.ext.stanford_town.utils.utils import copy_folder +from metagpt.logs import logger + + +async def startup( + idea: str, fork_sim_code: str, sim_code: str, temp_storage_path: str, investment: float = 30.0, n_round: int = 500 +): + town = StanfordTown() + logger.info("StanfordTown init environment") + + # copy `storage/{fork_sim_code}` to `storage/{sim_code}` + copy_folder(str(STORAGE_PATH.joinpath(fork_sim_code)), str(STORAGE_PATH.joinpath(sim_code))) + + # get role names from `storage/{simulation_name}/reverie/meta.json` and then init roles + reverie_meta = get_reverie_meta(fork_sim_code) + roles = [] + sim_path = STORAGE_PATH.joinpath(sim_code) + sim_path.mkdir(exist_ok=True) + for idx, 
role_name in enumerate(reverie_meta["persona_names"]): + has_inner_voice = idx == 0  # only the first persona receives the inner voice + role = STRole( + name=role_name, + profile=role_name, + sim_code=sim_code, + step=reverie_meta.get("step", 0), + start_time=reverie_meta.get("start_date"), + curr_time=reverie_meta.get("curr_time"), + sec_per_step=reverie_meta.get("sec_per_step"), + has_inner_voice=has_inner_voice, + ) + roles.append(role) + + # init temp_storage + write_curr_sim_code({"sim_code": sim_code}, temp_storage_path) + write_curr_step({"step": reverie_meta.get("step", 0)}, temp_storage_path) + + await town.hire(roles) + + town.invest(investment) + town.run_project(idea) + + await town.run(n_round) + + +def main( + idea: str, + fork_sim_code: str, + sim_code: str, + temp_storage_path: Optional[str] = None, + investment: float = 30.0, + n_round: int = 500, +): + """ + Args: + idea: the idea works as an `inner voice` for the first agent. + fork_sim_code: old simulation name to start with; choose one inside `generative_agents/environment/frontend_server/storage/` + sim_code: new simulation name under which to save the simulation result + temp_storage_path: generative_agents temp_storage path inside `environment/frontend_server` used to interact. 
+ investment: the investment of running agents + n_round: rounds to run agents + """ + + asyncio.run( + startup( + idea=idea, + fork_sim_code=fork_sim_code, + sim_code=sim_code, + temp_storage_path=temp_storage_path, + investment=investment, + n_round=n_round, + ) + ) + + +if __name__ == "__main__": + fire.Fire(main) diff --git a/examples/stanford_town/storage/.gitignore b/examples/stanford_town/storage/.gitignore new file mode 100644 index 000000000..962820861 --- /dev/null +++ b/examples/stanford_town/storage/.gitignore @@ -0,0 +1,4 @@ +# path to store simulation data +test_* +unittest* +July* \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/environment/0.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/environment/0.json new file mode 100644 index 000000000..6eaa46c51 --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/environment/0.json @@ -0,0 +1,26 @@ +{ + "Isabella Rodriguez": { + "maze": "the_ville", + "x": 72, + "y": 14 + }, + "Klaus Mueller": { + "maze": "the_ville", + "x": 126, + "y": 46 + }, + "Maria Lopez": { + "maze": "the_ville", + "x": 123, + "y": 57 + } +} + + + + + + + + + diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/associative_memory/embeddings.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/associative_memory/embeddings.json new file mode 100644 index 000000000..9e26dfeeb --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/associative_memory/embeddings.json @@ -0,0 +1 @@ +{} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/associative_memory/kw_strength.json 
b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/associative_memory/kw_strength.json new file mode 100644 index 000000000..6dc73c1c8 --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/associative_memory/kw_strength.json @@ -0,0 +1,2 @@ +{"kw_strength_event": {}, + "kw_strength_thought": {}} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/associative_memory/nodes.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/associative_memory/nodes.json new file mode 100644 index 000000000..9e26dfeeb --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/associative_memory/nodes.json @@ -0,0 +1 @@ +{} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/scratch.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/scratch.json new file mode 100644 index 000000000..dbed4b705 --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/scratch.json @@ -0,0 +1,51 @@ +{ + "vision_r": 8, + "att_bandwidth": 8, + "retention": 8, + "curr_time": null, + "curr_tile": null, + "daily_plan_req": "Isabella Rodriguez opens Hobbs Cafe at 8am everyday, and works at the counter until 8pm, at which point she closes the cafe.", + "name": "Isabella Rodriguez", + "first_name": "Isabella", + "last_name": "Rodriguez", + "age": 34, + "innate": "friendly, outgoing, hospitable", + "learned": "Isabella Rodriguez is a cafe owner of Hobbs Cafe who loves to make people feel welcome. 
She is always looking for ways to make the cafe a place where people can come to relax and enjoy themselves.", + "currently": "Isabella Rodriguez is planning on having a Valentine's Day party at Hobbs Cafe with her customers on February 14th, 2023 at 5pm. She is gathering party material, and is telling everyone to join the party at Hobbs Cafe on February 14th, 2023, from 5pm to 7pm.", + "lifestyle": "Isabella Rodriguez goes to bed around 11pm, awakes up around 6am.", + "living_area": "the Ville:Isabella Rodriguez's apartment:main room", + "concept_forget": 100, + "daily_reflection_time": 180, + "daily_reflection_size": 5, + "overlap_reflect_th": 4, + "kw_strg_event_reflect_th": 10, + "kw_strg_thought_reflect_th": 9, + + "recency_w": 1, + "relevance_w": 1, + "importance_w": 1, + "recency_decay": 0.995, + "importance_trigger_max": 150, + "importance_trigger_curr": 150, + "importance_ele_n": 0, + "thought_count": 5, + + "daily_req": [], + "f_daily_schedule": [], + "f_daily_schedule_hourly_org": [], + "act_address": null, + "act_start_time": null, + "act_duration": null, + "act_description": null, + "act_pronunciatio": null, + "act_event": ["Isabella Rodriguez", null, null], + "act_obj_description": null, + "act_obj_pronunciatio": null, + "act_obj_event": [null, null, null], + "chatting_with": null, + "chat": null, + "chatting_with_buffer": {}, + "chatting_end_time": null, + "act_path_set": false, + "planned_path": [] +} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/spatial_memory.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/spatial_memory.json new file mode 100644 index 000000000..f88157950 --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Isabella Rodriguez/bootstrap_memory/spatial_memory.json @@ -0,0 +1,66 @@ +{ + "the Ville": { + "Hobbs 
Cafe": { + "cafe": [ + "refrigerator", + "cafe customer seating", + "cooking area", + "kitchen sink", + "behind the cafe counter", + "piano" + ] + }, + "Isabella Rodriguez's apartment": { + "main room": [ + "bed", + "desk", + "refrigerator", + "closet", + "shelf" + ] + }, + "The Rose and Crown Pub": { + "pub": [ + "shelf", + "refrigerator", + "bar customer seating", + "behind the bar counter", + "kitchen sink", + "cooking area", + "microphone" + ] + }, + "Harvey Oak Supply Store": { + "supply store": [ + "supply store product shelf", + "behind the supply store counter", + "supply store counter" + ] + }, + "The Willows Market and Pharmacy": { + "store": [ + "behind the pharmacy counter", + "pharmacy store shelf", + "pharmacy store counter", + "grocery store shelf", + "behind the grocery counter", + "grocery store counter" + ] + }, + "Dorm for Oak Hill College": { + "garden": [ + "dorm garden" + ], + "common room": [ + "common room sofa", + "pool table", + "common room table" + ] + }, + "Johnson Park": { + "park": [ + "park garden" + ] + } + } +} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/associative_memory/embeddings.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/associative_memory/embeddings.json new file mode 100644 index 000000000..9e26dfeeb --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/associative_memory/embeddings.json @@ -0,0 +1 @@ +{} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/associative_memory/kw_strength.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/associative_memory/kw_strength.json new file mode 100644 index 000000000..6dc73c1c8 --- 
/dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/associative_memory/kw_strength.json @@ -0,0 +1,2 @@ +{"kw_strength_event": {}, + "kw_strength_thought": {}} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/associative_memory/nodes.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/associative_memory/nodes.json new file mode 100644 index 000000000..9e26dfeeb --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/associative_memory/nodes.json @@ -0,0 +1 @@ +{} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/scratch.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/scratch.json new file mode 100644 index 000000000..7b0ce7d72 --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/scratch.json @@ -0,0 +1,51 @@ +{ + "vision_r": 8, + "att_bandwidth": 8, + "retention": 8, + "curr_time": null, + "curr_tile": null, + "daily_plan_req": "Klaus Mueller goes to the library at Oak Hill College early in the morning, spends his days writing, and eats at Hobbs Cafe.", + "name": "Klaus Mueller", + "first_name": "Klaus", + "last_name": "Mueller", + "age": 20, + "innate": "kind, inquisitive, passionate", + "learned": "Klaus Mueller is a student at Oak Hill College studying sociology. 
He is passionate about social justice and loves to explore different perspectives.", + "currently": "Klaus Mueller is writing a research paper on the effects of gentrification in low-income communities.", + "lifestyle": "Klaus Mueller goes to bed around 11pm, awakes up around 7am, eats dinner around 5pm.", + "living_area": "the Ville:Dorm for Oak Hill College:Klaus Mueller's room", + "concept_forget": 100, + "daily_reflection_time": 180, + "daily_reflection_size": 5, + "overlap_reflect_th": 4, + "kw_strg_event_reflect_th": 10, + "kw_strg_thought_reflect_th": 9, + + "recency_w": 1, + "relevance_w": 1, + "importance_w": 1, + "recency_decay": 0.99, + "importance_trigger_max": 150, + "importance_trigger_curr": 150, + "importance_ele_n": 0, + "thought_count": 5, + + "daily_req": [], + "f_daily_schedule": [], + "f_daily_schedule_hourly_org": [], + "act_address": null, + "act_start_time": null, + "act_duration": null, + "act_description": null, + "act_pronunciatio": null, + "act_event": ["Klaus Mueller", null, null], + "act_obj_description": null, + "act_obj_pronunciatio": null, + "act_obj_event": [null, null, null], + "chatting_with": null, + "chat": null, + "chatting_with_buffer": {}, + "chatting_end_time": null, + "act_path_set": false, + "planned_path": [] +} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/spatial_memory.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/spatial_memory.json new file mode 100644 index 000000000..4f4168677 --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Klaus Mueller/bootstrap_memory/spatial_memory.json @@ -0,0 +1,86 @@ +{ + "the Ville": { + "Oak Hill College": { + "hallway": [], + "library": [ + "library sofa", + "library table", + "bookshelf" + ], + "classroom": [ + "blackboard", + "classroom podium", + "classroom student 
seating" + ] + }, + "Dorm for Oak Hill College": { + "garden": [ + "dorm garden" + ], + "Klaus Mueller's room": [ + "bed", + "game console", + "closet", + "desk" + ], + "woman's bathroom": [ + "toilet", + "shower", + "bathroom sink" + ], + "common room": [ + "common room sofa", + "pool table", + "common room table" + ], + "man's bathroom": [ + "shower", + "bathroom sink", + "toilet" + ] + }, + "The Willows Market and Pharmacy": { + "store": [ + "grocery store shelf", + "behind the grocery counter", + "grocery store counter", + "pharmacy store shelf", + "pharmacy store counter", + "behind the pharmacy counter" + ] + }, + "Harvey Oak Supply Store": { + "supply store": [ + "supply store product shelf", + "behind the supply store counter", + "supply store counter" + ] + }, + "Johnson Park": { + "park": [ + "park garden" + ] + }, + "The Rose and Crown Pub": { + "pub": [ + "shelf", + "refrigerator", + "bar customer seating", + "behind the bar counter", + "kitchen sink", + "cooking area", + "microphone" + ] + }, + "Hobbs Cafe": { + "cafe": [ + "refrigerator", + "cafe customer seating", + "cooking area", + "kitchen sink", + "behind the cafe counter", + "piano" + ] + } + } +} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/associative_memory/embeddings.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/associative_memory/embeddings.json new file mode 100644 index 000000000..9e26dfeeb --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/associative_memory/embeddings.json @@ -0,0 +1 @@ +{} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/associative_memory/kw_strength.json 
b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/associative_memory/kw_strength.json new file mode 100644 index 000000000..6dc73c1c8 --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/associative_memory/kw_strength.json @@ -0,0 +1,2 @@ +{"kw_strength_event": {}, + "kw_strength_thought": {}} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/associative_memory/nodes.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/associative_memory/nodes.json new file mode 100644 index 000000000..9e26dfeeb --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/associative_memory/nodes.json @@ -0,0 +1 @@ +{} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/scratch.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/scratch.json new file mode 100644 index 000000000..c3a304952 --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/scratch.json @@ -0,0 +1,51 @@ +{ + "vision_r": 8, + "att_bandwidth": 8, + "retention": 8, + "curr_time": null, + "curr_tile": null, + "daily_plan_req": "Maria Lopez spends at least 3 hours a day Twitch streaming or gaming.", + "name": "Maria Lopez", + "first_name": "Maria", + "last_name": "Lopez", + "age": 21, + "innate": "energetic, enthusiastic, inquisitive", + "learned": "Maria Lopez is a student at Oak Hill College studying physics and a part time Twitch game streamer who loves to connect with people and explore new ideas.", + "currently": "Maria Lopez is working on her physics 
degree and streaming games on Twitch to make some extra money. She visits Hobbs Cafe for studying and eating just about everyday.", + "lifestyle": "Maria Lopez goes to bed around 2am, awakes up around 9am, eats dinner around 6pm. She likes to hang out at Hobbs Cafe if it's before 6pm.", + "living_area": "the Ville:Dorm for Oak Hill College:Maria Lopez's room", + "concept_forget": 100, + "daily_reflection_time": 180, + "daily_reflection_size": 5, + "overlap_reflect_th": 4, + "kw_strg_event_reflect_th": 10, + "kw_strg_thought_reflect_th": 9, + + "recency_w": 1, + "relevance_w": 1, + "importance_w": 1, + "recency_decay": 0.99, + "importance_trigger_max": 150, + "importance_trigger_curr": 150, + "importance_ele_n": 0, + "thought_count": 5, + + "daily_req": [], + "f_daily_schedule": [], + "f_daily_schedule_hourly_org": [], + "act_address": null, + "act_start_time": null, + "act_duration": null, + "act_description": null, + "act_pronunciatio": null, + "act_event": ["Maria Lopez", null, null], + "act_obj_description": null, + "act_obj_pronunciatio": null, + "act_obj_event": [null, null, null], + "chatting_with": null, + "chat": null, + "chatting_with_buffer": {}, + "chatting_end_time": null, + "act_path_set": false, + "planned_path": [] +} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/spatial_memory.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/spatial_memory.json new file mode 100644 index 000000000..0a58212bd --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/personas/Maria Lopez/bootstrap_memory/spatial_memory.json @@ -0,0 +1,87 @@ +{ + "the Ville": { + "Oak Hill College": { + "hallway": [], + "library": [ + "library sofa", + "library table", + "bookshelf" + ], + "classroom": [ + "blackboard", + "classroom podium", + "classroom student seating" + ] + }, + "Dorm for Oak 
Hill College": { + "garden": [ + "dorm garden" + ], + "Maria Lopez's room": [ + "closet", + "desk", + "bed", + "computer", + "blackboard" + ], + "woman's bathroom": [ + "toilet", + "shower", + "bathroom sink" + ], + "common room": [ + "common room sofa", + "pool table", + "common room table" + ], + "man's bathroom": [ + "shower", + "bathroom sink", + "toilet" + ] + }, + "The Willows Market and Pharmacy": { + "store": [ + "grocery store shelf", + "behind the grocery counter", + "grocery store counter", + "pharmacy store shelf", + "pharmacy store counter", + "behind the pharmacy counter" + ] + }, + "Harvey Oak Supply Store": { + "supply store": [ + "supply store product shelf", + "behind the supply store counter", + "supply store counter" + ] + }, + "Johnson Park": { + "park": [ + "park garden" + ] + }, + "The Rose and Crown Pub": { + "pub": [ + "shelf", + "refrigerator", + "bar customer seating", + "behind the bar counter", + "kitchen sink", + "cooking area", + "microphone" + ] + }, + "Hobbs Cafe": { + "cafe": [ + "refrigerator", + "cafe customer seating", + "cooking area", + "kitchen sink", + "behind the cafe counter", + "piano" + ] + } + } +} \ No newline at end of file diff --git a/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/reverie/meta.json b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/reverie/meta.json new file mode 100644 index 000000000..1e81ec12d --- /dev/null +++ b/examples/stanford_town/storage/base_the_ville_isabella_maria_klaus/reverie/meta.json @@ -0,0 +1,13 @@ +{ + "fork_sim_code": "base_the_ville_isabella_maria_klaus", + "start_date": "February 13, 2023", + "curr_time": "February 13, 2023, 00:00:00", + "sec_per_step": 10, + "maze_name": "the_ville", + "persona_names": [ + "Isabella Rodriguez", + "Maria Lopez", + "Klaus Mueller" + ], + "step": 0 +} \ No newline at end of file diff --git a/metagpt/actions/action_node.py b/metagpt/actions/action_node.py index 09da4a988..31e4cc0fc 100644 --- 
a/metagpt/actions/action_node.py +++ b/metagpt/actions/action_node.py @@ -17,6 +17,7 @@ from pydantic import BaseModel, Field, create_model, model_validator from tenacity import retry, stop_after_attempt, wait_random_exponential from metagpt.actions.action_outcls_registry import register_action_outcls +from metagpt.const import USE_CONFIG_TIMEOUT from metagpt.llm import BaseLLM from metagpt.logs import logger from metagpt.provider.postprocess.llm_output_postprocess import llm_output_postprocess @@ -330,7 +331,7 @@ class ActionNode: def compile_to(self, i: Dict, schema, kv_sep) -> str: if schema == "json": - return json.dumps(i, indent=4) + return json.dumps(i, indent=4, ensure_ascii=False) elif schema == "markdown": return dict_to_markdown(i, kv_sep=kv_sep) else: @@ -339,10 +340,7 @@ class ActionNode: def tagging(self, text, schema, tag="") -> str: if not tag: return text - if schema == "json": - return f"[{tag}]\n" + text + f"\n[/{tag}]" - else: # markdown - return f"[{tag}]\n" + text + f"\n[/{tag}]" + return f"[{tag}]\n{text}\n[/{tag}]" def _compile_f(self, schema, mode, tag, format_func, kv_sep, exclude=None) -> str: nodes = self.to_dict(format_func=format_func, mode=mode, exclude=exclude) @@ -374,7 +372,7 @@ class ActionNode: schema="markdown": 编译context, example(markdown), instruction(markdown), constraint, action """ if schema == "raw": - return context + "\n\n## Actions\n" + LANGUAGE_CONSTRAINT + "\n" + self.instruction + return f"{context}\n\n## Actions\n{LANGUAGE_CONSTRAINT}\n{self.instruction}" ### 直接使用 pydantic BaseModel 生成 instruction 与 example,仅限 JSON # child_class = self._create_children_class() @@ -416,7 +414,7 @@ class ActionNode: images: Optional[Union[str, list[str]]] = None, system_msgs: Optional[list[str]] = None, schema="markdown", # compatible to original format - timeout=3, + timeout=USE_CONFIG_TIMEOUT, ) -> (str, BaseModel): """Use ActionOutput to wrap the output of aask""" content = await self.llm.aask(prompt, system_msgs, images=images, 
timeout=timeout) @@ -448,7 +446,9 @@ class ActionNode: def set_context(self, context): self.set_recursive("context", context) - async def simple_fill(self, schema, mode, images: Optional[Union[str, list[str]]] = None, timeout=3, exclude=None): + async def simple_fill( + self, schema, mode, images: Optional[Union[str, list[str]]] = None, timeout=USE_CONFIG_TIMEOUT, exclude=None + ): prompt = self.compile(context=self.context, schema=schema, mode=mode, exclude=exclude) if schema != "raw": @@ -473,7 +473,7 @@ class ActionNode: mode="auto", strgy="simple", images: Optional[Union[str, list[str]]] = None, - timeout=3, + timeout=USE_CONFIG_TIMEOUT, exclude=[], ): """Fill the node(s) with mode. diff --git a/metagpt/actions/di/execute_nb_code.py b/metagpt/actions/di/execute_nb_code.py index f6a8defbd..0cf16b70f 100644 --- a/metagpt/actions/di/execute_nb_code.py +++ b/metagpt/actions/di/execute_nb_code.py @@ -57,8 +57,23 @@ class ExecuteNbCode(Action): async def terminate(self): """kill NotebookClient""" - if self.nb_client.km is not None: - await self.nb_client._async_cleanup_kernel() + if self.nb_client.km is not None and await self.nb_client.km.is_alive(): + await self.nb_client.km.shutdown_kernel(now=True) + await self.nb_client.km.cleanup_resources() + + channels = [ + self.nb_client.kc.stdin_channel, # The channel for handling standard input to the kernel. + self.nb_client.kc.hb_channel, # The channel for heartbeat communication between the kernel and client. + self.nb_client.kc.control_channel, # The channel for controlling the kernel. 
+ ] + + # Stops all the running channels for this kernel + for channel in channels: + if channel.is_alive(): + channel.stop() + + self.nb_client.kc = None + self.nb_client.km = None async def reset(self): """reset NotebookClient""" diff --git a/metagpt/actions/di/write_analysis_code.py b/metagpt/actions/di/write_analysis_code.py index 185926e31..711e56d39 100644 --- a/metagpt/actions/di/write_analysis_code.py +++ b/metagpt/actions/di/write_analysis_code.py @@ -18,7 +18,7 @@ from metagpt.prompts.di.write_analysis_code import ( STRUCTUAL_PROMPT, ) from metagpt.schema import Message, Plan -from metagpt.utils.common import CodeParser, process_message, remove_comments +from metagpt.utils.common import CodeParser, remove_comments class WriteAnalysisCode(Action): @@ -50,7 +50,7 @@ class WriteAnalysisCode(Action): ) working_memory = working_memory or [] - context = process_message([Message(content=structual_prompt, role="user")] + working_memory) + context = self.llm.format_msg([Message(content=structual_prompt, role="user")] + working_memory) # LLM call if use_reflection: diff --git a/metagpt/actions/research.py b/metagpt/actions/research.py index ce8d8a967..2a99a8d99 100644 --- a/metagpt/actions/research.py +++ b/metagpt/actions/research.py @@ -134,7 +134,7 @@ class CollectLinks(Action): break model_name = config.llm.model - prompt = reduce_message_length(gen_msg(), model_name, system_text, 4096) + prompt = reduce_message_length(gen_msg(), model_name, system_text, config.llm.max_token) logger.debug(prompt) queries = await self._aask(prompt, [system_text]) try: diff --git a/metagpt/config2.py b/metagpt/config2.py index bc6af18c6..f3273419f 100644 --- a/metagpt/config2.py +++ b/metagpt/config2.py @@ -92,7 +92,7 @@ class Config(CLIParams, YamlModel): """ default_config_paths: List[Path] = [ METAGPT_ROOT / "config/config2.yaml", - Path.home() / ".metagpt/config2.yaml", + CONFIG_ROOT / "config2.yaml", ] dicts = [dict(os.environ)] @@ -100,6 +100,20 @@ class Config(CLIParams, 
YamlModel): final = merge_dict(dicts) return Config(**final) + @classmethod + def from_llm_config(cls, llm_config: dict): + """Create a Config instance from a user-provided LLM config dict. + example: + llm_config = {"api_type": "xxx", "api_key": "xxx", "model": "xxx"} + gpt4 = Config.from_llm_config(llm_config) + A = Role(name="A", profile="Democratic candidate", goal="Win the election", actions=[a1], watch=[a2], config=gpt4) + """ + llm_config = LLMConfig.model_validate(llm_config) + dicts = [dict(os.environ)] + dicts += [{"llm": llm_config}] + final = merge_dict(dicts) + return Config(**final) + def update_via_cli(self, project_path, project_name, inc, reqa_file, max_auto_summarize_code): """update config via cli""" diff --git a/metagpt/configs/llm_config.py b/metagpt/configs/llm_config.py index 77bfc8466..af8f56372 100644 --- a/metagpt/configs/llm_config.py +++ b/metagpt/configs/llm_config.py @@ -10,6 +10,7 @@ from typing import Optional from pydantic import field_validator +from metagpt.const import LLM_API_TIMEOUT from metagpt.utils.yaml_model import YamlModel @@ -29,6 +30,7 @@ class LLMType(Enum): DASHSCOPE = "dashscope" # Aliyun LingJi DashScope MOONSHOT = "moonshot" MISTRAL = "mistral" + YI = "yi" # lingyiwanwu def __missing__(self, key): return self.OPENAI @@ -73,7 +75,7 @@ class LLMConfig(YamlModel): stream: bool = False logprobs: Optional[bool] = None # https://cookbook.openai.com/examples/using_logprobs top_logprobs: Optional[int] = None - timeout: int = 60 + timeout: int = 600 # For Network proxy: Optional[str] = None @@ -87,3 +89,8 @@ class LLMConfig(YamlModel): if v in ["", None, "YOUR_API_KEY"]: raise ValueError("Please set your API key in config2.yaml") return v + + @field_validator("timeout") + @classmethod + def check_timeout(cls, v): + return v or LLM_API_TIMEOUT diff --git a/metagpt/configs/search_config.py b/metagpt/configs/search_config.py index af928b02a..e28b14c99 100644 --- a/metagpt/configs/search_config.py +++ b/metagpt/configs/search_config.py @@ -7,6 +7,8 @@ """ from typing import
Callable, Optional +from pydantic import Field + from metagpt.tools import SearchEngineType from metagpt.utils.yaml_model import YamlModel @@ -18,3 +20,11 @@ class SearchConfig(YamlModel): api_key: str = "" cse_id: str = "" # for google search_func: Optional[Callable] = None + params: dict = Field( + default_factory=lambda: { + "engine": "google", + "google_domain": "google.com", + "gl": "us", + "hl": "en", + } + ) diff --git a/metagpt/const.py b/metagpt/const.py index a5e3ea9c2..e4cebfd96 100644 --- a/metagpt/const.py +++ b/metagpt/const.py @@ -49,6 +49,7 @@ METAGPT_ROOT = get_metagpt_root() # Dependent on METAGPT_PROJECT_ROOT DEFAULT_WORKSPACE_ROOT = METAGPT_ROOT / "workspace" EXAMPLE_PATH = METAGPT_ROOT / "examples" +EXAMPLE_DATA_PATH = EXAMPLE_PATH / "data" DATA_PATH = METAGPT_ROOT / "data" TEST_DATA_PATH = METAGPT_ROOT / "tests/data" RESEARCH_PATH = DATA_PATH / "research" @@ -122,7 +123,6 @@ BASE64_FORMAT = "base64" # REDIS REDIS_KEY = "REDIS_KEY" -LLM_API_TIMEOUT = 300 # Message id IGNORED_MESSAGE_ID = "0" @@ -131,3 +131,7 @@ IGNORED_MESSAGE_ID = "0" GENERALIZATION = "Generalize" COMPOSITION = "Composite" AGGREGATION = "Aggregate" + +# Timeout +USE_CONFIG_TIMEOUT = 0 # Using llm.timeout configuration. 
+LLM_API_TIMEOUT = 300 diff --git a/metagpt/document.py b/metagpt/document.py index 1a3c4b2f8..4a8bb68d5 100644 --- a/metagpt/document.py +++ b/metagpt/document.py @@ -11,12 +11,9 @@ from pathlib import Path from typing import Optional, Union import pandas as pd -from langchain.text_splitter import CharacterTextSplitter -from langchain_community.document_loaders import ( - TextLoader, - UnstructuredPDFLoader, - UnstructuredWordDocumentLoader, -) +from llama_index.core import Document, SimpleDirectoryReader +from llama_index.core.node_parser import SimpleNodeParser +from llama_index.readers.file import PDFReader from pydantic import BaseModel, ConfigDict, Field from tqdm import tqdm @@ -29,7 +26,7 @@ def validate_cols(content_col: str, df: pd.DataFrame): raise ValueError("Content column not found in DataFrame.") -def read_data(data_path: Path): +def read_data(data_path: Path) -> Union[pd.DataFrame, list[Document]]: suffix = data_path.suffix if ".xlsx" == suffix: data = pd.read_excel(data_path) @@ -38,14 +35,13 @@ elif ".json" == suffix: data = pd.read_json(data_path) elif suffix in (".docx", ".doc"): - data = UnstructuredWordDocumentLoader(str(data_path), mode="elements").load() + data = SimpleDirectoryReader(input_files=[str(data_path)]).load_data() elif ".txt" == suffix: - data = TextLoader(str(data_path)).load() - text_splitter = CharacterTextSplitter(separator="\n", chunk_size=256, chunk_overlap=0) - texts = text_splitter.split_documents(data) - data = texts + data = SimpleDirectoryReader(input_files=[str(data_path)]).load_data() + node_parser = SimpleNodeParser.from_defaults(separator="\n", chunk_size=256, chunk_overlap=0) + data = node_parser.get_nodes_from_documents(data) elif ".pdf" == suffix: - data = UnstructuredPDFLoader(str(data_path), mode="elements").load() + data = PDFReader().load_data(file=data_path) # load_data is an instance method taking a Path else: raise NotImplementedError("File format not supported.") return data @@ -150,9 +146,9 @@ class
IndexableDocument(Document): metadatas.append({}) return docs, metadatas - def _get_docs_and_metadatas_by_langchain(self) -> (list, list): + def _get_docs_and_metadatas_by_llamaindex(self) -> (list, list): data = self.data - docs = [i.page_content for i in data] + docs = [i.text for i in data] metadatas = [i.metadata for i in data] return docs, metadatas @@ -160,7 +156,7 @@ class IndexableDocument(Document): if isinstance(self.data, pd.DataFrame): return self._get_docs_and_metadatas_by_df() elif isinstance(self.data, list): - return self._get_docs_and_metadatas_by_langchain() + return self._get_docs_and_metadatas_by_llamaindex() else: raise NotImplementedError("Data type not supported for metadata extraction.") diff --git a/metagpt/document_store/base_store.py b/metagpt/document_store/base_store.py index ddc1d626b..6aafc57bb 100644 --- a/metagpt/document_store/base_store.py +++ b/metagpt/document_store/base_store.py @@ -38,9 +38,9 @@ class LocalStore(BaseStore, ABC): if not self.store: self.store = self.write() - def _get_index_and_store_fname(self, index_ext=".index", pkl_ext=".pkl"): - index_file = self.cache_dir / f"{self.fname}{index_ext}" - store_file = self.cache_dir / f"{self.fname}{pkl_ext}" + def _get_index_and_store_fname(self, index_ext=".json", docstore_ext=".json"): + index_file = self.cache_dir / f"default__vector_store{index_ext}" + store_file = self.cache_dir / f"docstore{docstore_ext}" return index_file, store_file @abstractmethod diff --git a/metagpt/document_store/chromadb_store.py b/metagpt/document_store/chromadb_store.py index d7344d41b..1d3a014ee 100644 --- a/metagpt/document_store/chromadb_store.py +++ b/metagpt/document_store/chromadb_store.py @@ -11,9 +11,9 @@ import chromadb class ChromaStore: """If inherited from BaseStore, or importing other modules from metagpt, a Python exception occurs, which is strange.""" - def __init__(self, name): + def __init__(self, name: str, get_or_create: bool = False): client = chromadb.Client() -
collection = client.create_collection(name) + collection = client.create_collection(name, get_or_create=get_or_create) self.client = client self.collection = collection diff --git a/metagpt/document_store/faiss_store.py b/metagpt/document_store/faiss_store.py index 2359917d5..b196bef27 100644 --- a/metagpt/document_store/faiss_store.py +++ b/metagpt/document_store/faiss_store.py @@ -7,10 +7,14 @@ """ import asyncio from pathlib import Path -from typing import Optional +from typing import Any, Optional -from langchain.vectorstores import FAISS -from langchain_core.embeddings import Embeddings +import faiss +from llama_index.core import VectorStoreIndex, load_index_from_storage +from llama_index.core.embeddings import BaseEmbedding +from llama_index.core.schema import Document, QueryBundle, TextNode +from llama_index.core.storage import StorageContext +from llama_index.vector_stores.faiss import FaissVectorStore from metagpt.document import IndexableDocument from metagpt.document_store.base_store import LocalStore @@ -20,36 +24,50 @@ from metagpt.utils.embedding import get_embedding class FaissStore(LocalStore): def __init__( - self, raw_data: Path, cache_dir=None, meta_col="source", content_col="output", embedding: Embeddings = None + self, raw_data: Path, cache_dir=None, meta_col="source", content_col="output", embedding: BaseEmbedding = None ): self.meta_col = meta_col self.content_col = content_col self.embedding = embedding or get_embedding() + self.store: VectorStoreIndex super().__init__(raw_data, cache_dir) - def _load(self) -> Optional["FaissStore"]: - index_file, store_file = self._get_index_and_store_fname(index_ext=".faiss") # langchain FAISS using .faiss + def _load(self) -> Optional["VectorStoreIndex"]: + index_file, store_file = self._get_index_and_store_fname() if not (index_file.exists() and store_file.exists()): logger.info("Missing at least one of index_file/store_file, load failed and return None") return None + vector_store = 
FaissVectorStore.from_persist_dir(persist_dir=self.cache_dir) + storage_context = StorageContext.from_defaults(persist_dir=self.cache_dir, vector_store=vector_store) + index = load_index_from_storage(storage_context, embed_model=self.embedding) - return FAISS.load_local(self.raw_data_path.parent, self.embedding, self.fname) + return index - def _write(self, docs, metadatas): - store = FAISS.from_texts(docs, self.embedding, metadatas=metadatas) - return store + def _write(self, docs: list[str], metadatas: list[dict[str, Any]]) -> VectorStoreIndex: + assert len(docs) == len(metadatas) + documents = [Document(text=doc, metadata=metadatas[idx]) for idx, doc in enumerate(docs)] + + vector_store = FaissVectorStore(faiss_index=faiss.IndexFlatL2(1536)) + storage_context = StorageContext.from_defaults(vector_store=vector_store) + index = VectorStoreIndex.from_documents( + documents=documents, storage_context=storage_context, embed_model=self.embedding + ) + + return index def persist(self): - self.store.save_local(self.raw_data_path.parent, self.fname) + self.store.storage_context.persist(self.cache_dir) + + def search(self, query: str, expand_cols=False, sep="\n", *args, k=5, **kwargs): + retriever = self.store.as_retriever(similarity_top_k=k) + rsp = retriever.retrieve(QueryBundle(query_str=query, embedding=self.embedding.get_text_embedding(query))) - def search(self, query, expand_cols=False, sep="\n", *args, k=5, **kwargs): - rsp = self.store.similarity_search(query, k=k, **kwargs) logger.debug(rsp) if expand_cols: - return str(sep.join([f"{x.page_content}: {x.metadata}" for x in rsp])) + return str(sep.join([f"{x.node.text}: {x.node.metadata}" for x in rsp])) else: - return str(sep.join([f"{x.page_content}" for x in rsp])) + return str(sep.join([f"{x.node.text}" for x in rsp])) async def asearch(self, *args, **kwargs): return await asyncio.to_thread(self.search, *args, **kwargs) @@ -67,8 +85,12 @@ class FaissStore(LocalStore): def add(self, texts: list[str], *args, 
**kwargs) -> list[str]: """FIXME: Currently, the store is not updated after adding.""" - return self.store.add_texts(texts) + texts_embeds = self.embedding.get_text_embedding_batch(texts) + nodes = [TextNode(text=texts[idx], embedding=embed) for idx, embed in enumerate(texts_embeds)] + self.store.insert_nodes(nodes) + + return [] def delete(self, *args, **kwargs): - """Currently, langchain does not provide a delete interface.""" + """Currently, faiss does not provide a delete interface.""" raise NotImplementedError diff --git a/metagpt/environment/README.md b/metagpt/environment/README.md index 9476ac75a..bb7d50d50 100644 --- a/metagpt/environment/README.md +++ b/metagpt/environment/README.md @@ -21,7 +21,7 @@ ## Usage from metagpt.environment.api.env_api import EnvAPIAbstract # get screenshot from ExtEnv -screenshot_path: Path = env.observe( +screenshot_path: Path = await env.observe( EnvAPIAbstract( api_name="get_screenshot", kwargs={"ss_name": f"{round_count}_before", "local_save_dir": task_dir} ) @@ -34,5 +34,5 @@ # do a `tap` action on the screen ## TODO - add android app operation assistant under `examples/android_assistant` - migrate roles/actions of werewolf game from old version into current version -- migrate roles/actions of mincraft game from old version into current version +- migrate roles/actions of minecraft game from old version into current version - migrate roles/actions of stanford_town game from old version into current version diff --git a/metagpt/environment/__init__.py b/metagpt/environment/__init__.py index 692672fa7..0621fff16 100644 --- a/metagpt/environment/__init__.py +++ b/metagpt/environment/__init__.py @@ -3,11 +3,10 @@ # @Desc : from metagpt.environment.base_env import Environment -from metagpt.environment.android_env.android_env import AndroidEnv -from metagpt.environment.mincraft_env.mincraft_env import MincraftExtEnv -from metagpt.environment.werewolf_env.werewolf_env import WerewolfEnv -from 
metagpt.environment.stanford_town_env.stanford_town_env import StanfordTownEnv -from metagpt.environment.software_env.software_env import SoftwareEnv +from metagpt.environment.android.android_env import AndroidEnv +from metagpt.environment.werewolf.werewolf_env import WerewolfEnv +from metagpt.environment.stanford_town.stanford_town_env import StanfordTownEnv +from metagpt.environment.software.software_env import SoftwareEnv -__all__ = ["AndroidEnv", "MincraftExtEnv", "WerewolfEnv", "StanfordTownEnv", "SoftwareEnv", "Environment"] +__all__ = ["AndroidEnv", "WerewolfEnv", "StanfordTownEnv", "SoftwareEnv", "Environment"] diff --git a/metagpt/environment/mincraft_env/__init__.py b/metagpt/environment/android/__init__.py similarity index 100% rename from metagpt/environment/mincraft_env/__init__.py rename to metagpt/environment/android/__init__.py diff --git a/metagpt/environment/android_env/android_env.py b/metagpt/environment/android/android_env.py similarity index 83% rename from metagpt/environment/android_env/android_env.py rename to metagpt/environment/android/android_env.py index c27e20541..b3227df0f 100644 --- a/metagpt/environment/android_env/android_env.py +++ b/metagpt/environment/android/android_env.py @@ -4,7 +4,7 @@ from pydantic import Field -from metagpt.environment.android_env.android_ext_env import AndroidExtEnv +from metagpt.environment.android.android_ext_env import AndroidExtEnv from metagpt.environment.base_env import Environment diff --git a/metagpt/environment/android_env/android_ext_env.py b/metagpt/environment/android/android_ext_env.py similarity index 91% rename from metagpt/environment/android_env/android_ext_env.py rename to metagpt/environment/android/android_ext_env.py index b81b2cd26..d2344fa1f 100644 --- a/metagpt/environment/android_env/android_ext_env.py +++ b/metagpt/environment/android/android_ext_env.py @@ -8,8 +8,9 @@ from typing import Any, Optional from pydantic import Field -from metagpt.environment.android_env.const import 
ADB_EXEC_FAIL +from metagpt.environment.android.const import ADB_EXEC_FAIL from metagpt.environment.base_env import ExtEnv, mark_as_readable, mark_as_writeable +from metagpt.environment.base_env_space import BaseEnvAction, BaseEnvObsParams class AndroidExtEnv(ExtEnv): @@ -19,6 +20,20 @@ class AndroidExtEnv(ExtEnv): width: int = Field(default=720, description="device screen width") height: int = Field(default=1080, description="device screen height") + def reset( + self, + *, + seed: Optional[int] = None, + options: Optional[dict[str, Any]] = None, + ) -> tuple[dict[str, Any], dict[str, Any]]: + pass + + def observe(self, obs_params: Optional[BaseEnvObsParams] = None) -> Any: + pass + + def step(self, action: BaseEnvAction) -> tuple[dict[str, Any], float, bool, bool, dict[str, Any]]: + pass + def __init__(self, **data: Any): super().__init__(**data) if data.get("device_id"): diff --git a/metagpt/environment/android_env/const.py b/metagpt/environment/android/const.py similarity index 100% rename from metagpt/environment/android_env/const.py rename to metagpt/environment/android/const.py diff --git a/metagpt/environment/base_env.py b/metagpt/environment/base_env.py index 0e583ffb3..024c46877 100644 --- a/metagpt/environment/base_env.py +++ b/metagpt/environment/base_env.py @@ -3,9 +3,12 @@ # @Desc : base env of executing environment import asyncio +from abc import abstractmethod from enum import Enum from typing import TYPE_CHECKING, Any, Dict, Iterable, Optional, Set, Union +from gymnasium import spaces +from gymnasium.core import ActType, ObsType from pydantic import BaseModel, ConfigDict, Field, SerializeAsAny, model_validator from metagpt.context import Context @@ -14,6 +17,7 @@ from metagpt.environment.api.env_api import ( ReadAPIRegistry, WriteAPIRegistry, ) +from metagpt.environment.base_env_space import BaseEnvAction, BaseEnvObsParams from metagpt.logs import logger from metagpt.schema import Message from metagpt.utils.common import get_function_schema, 
is_coroutine_func, is_send_to @@ -26,7 +30,7 @@ class EnvType(Enum): ANDROID = "Android" GYM = "Gym" WEREWOLF = "Werewolf" - MINCRAFT = "Mincraft" + MINECRAFT = "Minecraft" STANFORDTOWN = "StanfordTown" @@ -47,7 +51,12 @@ def mark_as_writeable(func): class ExtEnv(BaseModel): - """External Env to intergate actual game environment""" + """External Env to integrate actual game environment""" + + model_config = ConfigDict(arbitrary_types_allowed=True) + + action_space: spaces.Space[ActType] = Field(default_factory=spaces.Space, exclude=True) + observation_space: spaces.Space[ObsType] = Field(default_factory=spaces.Space, exclude=True) def _check_api_exist(self, rw_api: Optional[str] = None): if not rw_api: @@ -61,39 +70,56 @@ class ExtEnv(BaseModel): else: return env_write_api_registry.get_apis() - async def observe(self, env_action: Union[str, EnvAPIAbstract]): + async def read_from_api(self, env_action: Union[str, EnvAPIAbstract]): """get observation from particular api of ExtEnv""" if isinstance(env_action, str): - read_api = env_read_api_registry.get(api_name=env_action)["func"] - self._check_api_exist(read_api) - if is_coroutine_func(read_api): - res = await read_api(self) + env_read_api = env_read_api_registry.get(api_name=env_action)["func"] + self._check_api_exist(env_read_api) + if is_coroutine_func(env_read_api): + res = await env_read_api(self) else: - res = read_api(self) + res = env_read_api(self) elif isinstance(env_action, EnvAPIAbstract): - read_api = env_read_api_registry.get(api_name=env_action.api_name)["func"] - self._check_api_exist(read_api) - if is_coroutine_func(read_api): - res = await read_api(self, *env_action.args, **env_action.kwargs) + env_read_api = env_read_api_registry.get(api_name=env_action.api_name)["func"] + self._check_api_exist(env_read_api) + if is_coroutine_func(env_read_api): + res = await env_read_api(self, *env_action.args, **env_action.kwargs) else: - res = read_api(self, *env_action.args, **env_action.kwargs) + res = 
env_read_api(self, *env_action.args, **env_action.kwargs) return res - async def step(self, env_action: Union[str, Message, EnvAPIAbstract, list[EnvAPIAbstract]]): + async def write_thru_api(self, env_action: Union[str, Message, EnvAPIAbstract, list[EnvAPIAbstract]]): """execute through particular api of ExtEnv""" res = None if isinstance(env_action, Message): self.publish_message(env_action) elif isinstance(env_action, EnvAPIAbstract): - write_api = env_write_api_registry.get(env_action.api_name)["func"] - self._check_api_exist(write_api) - if is_coroutine_func(write_api): - res = await write_api(self, *env_action.args, **env_action.kwargs) + env_write_api = env_write_api_registry.get(env_action.api_name)["func"] + self._check_api_exist(env_write_api) + if is_coroutine_func(env_write_api): + res = await env_write_api(self, *env_action.args, **env_action.kwargs) else: - res = write_api(self, *env_action.args, **env_action.kwargs) + res = env_write_api(self, *env_action.args, **env_action.kwargs) return res + @abstractmethod + def reset( + self, + *, + seed: Optional[int] = None, + options: Optional[dict[str, Any]] = None, + ) -> tuple[dict[str, Any], dict[str, Any]]: + """Implement this to get the initial observation""" + + @abstractmethod + def observe(self, obs_params: Optional[BaseEnvObsParams] = None) -> Any: + """Implement this if you want to get a partial observation from the env""" + + @abstractmethod + def step(self, action: BaseEnvAction) -> tuple[dict[str, Any], float, bool, bool, dict[str, Any]]: + """Implement this to feed an action and then get a new observation from the env""" + class Environment(ExtEnv): """Environment, hosting a batch of roles; roles can publish messages to the environment, and the messages can be observed by other roles @@ -108,6 +134,20 @@ class Environment(ExtEnv): history: str = "" # For debug context: Context = Field(default_factory=Context, exclude=True) + def reset( + self, + *, + seed: Optional[int] = None, + options: Optional[dict[str, Any]] = None, + ) -> tuple[dict[str, Any], dict[str, Any]]: + pass + + def observe(self, obs_params:
Optional[BaseEnvObsParams] = None) -> Any: + pass + + def step(self, action: BaseEnvAction) -> tuple[dict[str, Any], float, bool, bool, dict[str, Any]]: + pass + @model_validator(mode="after") def init_roles(self): self.add_roles(self.roles.values()) @@ -129,8 +169,8 @@ class Environment(ExtEnv): self.roles[role.profile] = role for role in roles: # setup system message with roles - role.set_env(self) role.context = self.context + role.set_env(self) def publish_message(self, message: Message, peekable: bool = True) -> bool: """ diff --git a/metagpt/environment/base_env_space.py b/metagpt/environment/base_env_space.py new file mode 100644 index 000000000..fd0cfa399 --- /dev/null +++ b/metagpt/environment/base_env_space.py @@ -0,0 +1,33 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : + +from enum import IntEnum + +from pydantic import BaseModel, ConfigDict, Field + + +class BaseEnvActionType(IntEnum): + # # NONE = 0 # no action to run, just get observation + pass + + +class BaseEnvAction(BaseModel): + """env action type and its related params of action functions/apis""" + + model_config = ConfigDict(arbitrary_types_allowed=True) + + action_type: int = Field(default=0, description="action type") + + +class BaseEnvObsType(IntEnum): + # # NONE = 0 # get whole observation from env + pass + + +class BaseEnvObsParams(BaseModel): + """observation params for different EnvObsType to get its observe result""" + + model_config = ConfigDict(arbitrary_types_allowed=True) + + obs_type: int = Field(default=0, description="observation type") diff --git a/metagpt/environment/software_env/__init__.py b/metagpt/environment/minecraft/__init__.py similarity index 100% rename from metagpt/environment/software_env/__init__.py rename to metagpt/environment/minecraft/__init__.py diff --git a/metagpt/environment/mincraft_env/const.py b/metagpt/environment/minecraft/const.py similarity index 92% rename from metagpt/environment/mincraft_env/const.py rename to 
metagpt/environment/minecraft/const.py index a7222f9cd..8ac15decc 100644 --- a/metagpt/environment/mincraft_env/const.py +++ b/metagpt/environment/minecraft/const.py @@ -4,8 +4,8 @@ from metagpt.const import METAGPT_ROOT -# For Mincraft Game Agent -MC_CKPT_DIR = METAGPT_ROOT / "data/mincraft/ckpt" +# For Minecraft Game Agent +MC_CKPT_DIR = METAGPT_ROOT / "data/minecraft/ckpt" MC_LOG_DIR = METAGPT_ROOT / "logs" MC_DEFAULT_WARMUP = { "context": 15, diff --git a/metagpt/environment/mincraft_env/mincraft_env.py b/metagpt/environment/minecraft/minecraft_env.py similarity index 93% rename from metagpt/environment/mincraft_env/mincraft_env.py rename to metagpt/environment/minecraft/minecraft_env.py index 6327aa3f4..0f39c9ccd 100644 --- a/metagpt/environment/mincraft_env/mincraft_env.py +++ b/metagpt/environment/minecraft/minecraft_env.py @@ -1,6 +1,6 @@ #!/usr/bin/env python # -*- coding: utf-8 -*- -# @Desc : MG Mincraft Env +# @Desc : MG Minecraft Env # refs to `voyager voyager.py` import json @@ -8,20 +8,19 @@ import re import time from typing import Any, Iterable -from langchain.embeddings.openai import OpenAIEmbeddings -from langchain.vectorstores import Chroma +from llama_index.vector_stores.chroma import ChromaVectorStore from pydantic import ConfigDict, Field from metagpt.config2 import config as CONFIG from metagpt.environment.base_env import Environment -from metagpt.environment.mincraft_env.const import MC_CKPT_DIR -from metagpt.environment.mincraft_env.mincraft_ext_env import MincraftExtEnv +from metagpt.environment.minecraft.const import MC_CKPT_DIR +from metagpt.environment.minecraft.minecraft_ext_env import MinecraftExtEnv from metagpt.logs import logger from metagpt.utils.common import load_mc_skills_code, read_json_file, write_json_file -class MincraftEnv(Environment, MincraftExtEnv): - """MincraftEnv, including shared memory of cache and infomation between roles""" +class MinecraftEnv(Environment, MinecraftExtEnv): + """MinecraftEnv, including shared 
memory of cache and information between roles""" model_config = ConfigDict(arbitrary_types_allowed=True) @@ -48,9 +47,9 @@ class MincraftEnv(Environment, MincraftExtEnv): runtime_status: bool = False # equal to action execution status: success or failed - vectordb: Chroma = Field(default_factory=Chroma) + vectordb: ChromaVectorStore = Field(default_factory=ChromaVectorStore) - qa_cache_questions_vectordb: Chroma = Field(default_factory=Chroma) + qa_cache_questions_vectordb: ChromaVectorStore = Field(default_factory=ChromaVectorStore) @property def progress(self): @@ -73,16 +72,14 @@ class MincraftEnv(Environment, MincraftExtEnv): self.set_mc_resume() def set_mc_resume(self): - self.qa_cache_questions_vectordb = Chroma( + self.qa_cache_questions_vectordb = ChromaVectorStore( collection_name="qa_cache_questions_vectordb", - embedding_function=OpenAIEmbeddings(), - persist_directory=f"{MC_CKPT_DIR}/curriculum/vectordb", + persist_dir=f"{MC_CKPT_DIR}/curriculum/vectordb", ) - self.vectordb = Chroma( + self.vectordb = ChromaVectorStore( collection_name="skill_vectordb", - embedding_function=OpenAIEmbeddings(), - persist_directory=f"{MC_CKPT_DIR}/skill/vectordb", + persist_dir=f"{MC_CKPT_DIR}/skill/vectordb", ) if CONFIG.resume: @@ -285,7 +282,7 @@ class MincraftEnv(Environment, MincraftExtEnv): position = event["status"]["position"] blocks.append(block) positions.append(position) - new_events = self.step( + new_events = self._step( f"await givePlacedItemBack(bot, {json.dumps(blocks)}, {json.dumps(positions)})", programs=self.programs, ) @@ -326,7 +323,7 @@ class MincraftEnv(Environment, MincraftExtEnv): Exception: If there is an issue retrieving events. 
""" try: - self.reset( + self._reset( options={ "mode": "soft", "wait_ticks": 20, @@ -335,13 +332,13 @@ class MincraftEnv(Environment, MincraftExtEnv): # difficulty = "easy" if len(self.completed_tasks) > 15 else "peaceful" difficulty = "peaceful" - events = self.step("bot.chat(`/time set ${getNextTime()}`);\n" + f"bot.chat('/difficulty {difficulty}');") + events = self._step("bot.chat(`/time set ${getNextTime()}`);\n" + f"bot.chat('/difficulty {difficulty}');") self.update_event(events) return events except Exception as e: time.sleep(3) # wait for mineflayer to exit # reset bot status here - events = self.reset( + events = self._reset( options={ "mode": "hard", "wait_ticks": 20, @@ -368,7 +365,7 @@ class MincraftEnv(Environment, MincraftExtEnv): Exception: If there is an issue retrieving events. """ try: - events = self.step( + events = self._step( code=self.code, programs=self.programs, ) @@ -377,7 +374,7 @@ class MincraftEnv(Environment, MincraftExtEnv): except Exception as e: time.sleep(3) # wait for mineflayer to exit # reset bot status here - events = self.reset( + events = self._reset( options={ "mode": "hard", "wait_ticks": 20, diff --git a/metagpt/environment/mincraft_env/mincraft_ext_env.py b/metagpt/environment/minecraft/minecraft_ext_env.py similarity index 87% rename from metagpt/environment/mincraft_env/mincraft_ext_env.py rename to metagpt/environment/minecraft/minecraft_ext_env.py index b86250d8c..0436bc3aa 100644 --- a/metagpt/environment/mincraft_env/mincraft_ext_env.py +++ b/metagpt/environment/minecraft/minecraft_ext_env.py @@ -1,28 +1,29 @@ #!/usr/bin/env python # -*- coding: utf-8 -*- -# @Desc : The Mincraft external environment to integrate with Mincraft game +# @Desc : The Minecraft external environment to integrate with Minecraft game # refs to `voyager bridge.py` import json import time -from typing import Optional +from typing import Any, Optional import requests from pydantic import ConfigDict, Field, model_validator from 
metagpt.environment.base_env import ExtEnv, mark_as_writeable -from metagpt.environment.mincraft_env.const import ( +from metagpt.environment.base_env_space import BaseEnvAction, BaseEnvObsParams +from metagpt.environment.minecraft.const import ( MC_CKPT_DIR, MC_CORE_INVENTORY_ITEMS, MC_CURRICULUM_OB, MC_DEFAULT_WARMUP, METAGPT_ROOT, ) -from metagpt.environment.mincraft_env.process_monitor import SubprocessMonitor +from metagpt.environment.minecraft.process_monitor import SubprocessMonitor from metagpt.logs import logger -class MincraftExtEnv(ExtEnv): +class MinecraftExtEnv(ExtEnv): model_config = ConfigDict(arbitrary_types_allowed=True) mc_port: Optional[int] = Field(default=None) @@ -38,6 +39,20 @@ class MincraftExtEnv(ExtEnv): server_paused: bool = Field(default=False) warm_up: dict = Field(default=dict()) + def reset( + self, + *, + seed: Optional[int] = None, + options: Optional[dict[str, Any]] = None, + ) -> tuple[dict[str, Any], dict[str, Any]]: + pass + + def observe(self, obs_params: Optional[BaseEnvObsParams] = None) -> Any: + pass + + def step(self, action: BaseEnvAction) -> tuple[dict[str, Any], float, bool, bool, dict[str, Any]]: + pass + @property def server(self) -> str: return f"{self.server_host}:{self.server_port}" @@ -48,7 +63,7 @@ class MincraftExtEnv(ExtEnv): self.mineflayer = SubprocessMonitor( commands=[ "node", - METAGPT_ROOT.joinpath("metagpt", "environment", "mincraft_env", "mineflayer", "index.js"), + METAGPT_ROOT.joinpath("metagpt", "environment", "minecraft", "mineflayer", "index.js"), str(self.server_port), ], name="mineflayer", @@ -115,7 +130,7 @@ class MincraftExtEnv(ExtEnv): return res.json() @mark_as_writeable - def reset(self, *, seed=None, options=None) -> dict: + def _reset(self, *, seed=None, options=None) -> dict: if options is None: options = {} if options.get("inventory", {}) and options.get("mode", "hard") != "hard": @@ -145,7 +160,7 @@ class MincraftExtEnv(ExtEnv): return json.loads(returned_data) @mark_as_writeable - def 
step(self, code: str, programs: str = "") -> dict: + def _step(self, code: str, programs: str = "") -> dict: if not self.has_reset: raise RuntimeError("Environment has not been reset yet") self.check_process() diff --git a/metagpt/environment/mincraft_env/mineflayer/.gitignore b/metagpt/environment/minecraft/mineflayer/.gitignore similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/.gitignore rename to metagpt/environment/minecraft/mineflayer/.gitignore diff --git a/metagpt/environment/mincraft_env/mineflayer/.prettierignore b/metagpt/environment/minecraft/mineflayer/.prettierignore similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/.prettierignore rename to metagpt/environment/minecraft/mineflayer/.prettierignore diff --git a/metagpt/environment/mincraft_env/mineflayer/.prettierrc.json b/metagpt/environment/minecraft/mineflayer/.prettierrc.json similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/.prettierrc.json rename to metagpt/environment/minecraft/mineflayer/.prettierrc.json diff --git a/metagpt/environment/mincraft_env/mineflayer/index.js b/metagpt/environment/minecraft/mineflayer/index.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/index.js rename to metagpt/environment/minecraft/mineflayer/index.js diff --git a/metagpt/environment/mincraft_env/mineflayer/lib/observation/base.js b/metagpt/environment/minecraft/mineflayer/lib/observation/base.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/lib/observation/base.js rename to metagpt/environment/minecraft/mineflayer/lib/observation/base.js diff --git a/metagpt/environment/mincraft_env/mineflayer/lib/observation/chests.js b/metagpt/environment/minecraft/mineflayer/lib/observation/chests.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/lib/observation/chests.js rename to metagpt/environment/minecraft/mineflayer/lib/observation/chests.js 
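A note for reviewers on the `reset`/`observe`/`step` contract this diff adds to `ExtEnv`: it mirrors gymnasium's API, where `step` returns a five-tuple `(observation, reward, terminated, truncated, info)`. Below is a minimal, self-contained sketch of a concrete environment satisfying that contract; `ExtEnvSketch` and `CounterEnv` are hypothetical stand-ins (no metagpt or gymnasium imports), not part of this diff:

```python
from abc import ABC, abstractmethod
from typing import Any, Optional


class ExtEnvSketch(ABC):
    """Hypothetical stand-in for metagpt's ExtEnv contract (illustration only)."""

    @abstractmethod
    def reset(
        self, *, seed: Optional[int] = None, options: Optional[dict[str, Any]] = None
    ) -> tuple[dict[str, Any], dict[str, Any]]:
        """Return (initial observation, info)."""

    @abstractmethod
    def observe(self, obs_params: Optional[dict] = None) -> Any:
        """Return a (partial) observation of the current state."""

    @abstractmethod
    def step(self, action: Any) -> tuple[dict[str, Any], float, bool, bool, dict[str, Any]]:
        """Return (observation, reward, terminated, truncated, info), gymnasium-style."""


class CounterEnv(ExtEnvSketch):
    """Toy env whose whole state is a counter; each step increments it."""

    def __init__(self) -> None:
        self.count = 0

    def reset(self, *, seed=None, options=None):
        self.count = 0
        return {"count": self.count}, {}

    def observe(self, obs_params=None):
        return {"count": self.count}

    def step(self, action):
        self.count += 1
        terminated = self.count >= 3  # episode ends after three steps
        return {"count": self.count}, 1.0, terminated, False, {}


env = CounterEnv()
obs, info = env.reset()
obs, reward, terminated, truncated, info = env.step("tick")
print(obs["count"])  # prints 1
```

The renamed `MinecraftExtEnv._reset`/`._step` above keep their voyager-specific signatures precisely so the public `reset`/`observe`/`step` names stay free for this gymnasium-shaped interface.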
diff --git a/metagpt/environment/mincraft_env/mineflayer/lib/observation/inventory.js b/metagpt/environment/minecraft/mineflayer/lib/observation/inventory.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/lib/observation/inventory.js rename to metagpt/environment/minecraft/mineflayer/lib/observation/inventory.js diff --git a/metagpt/environment/mincraft_env/mineflayer/lib/observation/onChat.js b/metagpt/environment/minecraft/mineflayer/lib/observation/onChat.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/lib/observation/onChat.js rename to metagpt/environment/minecraft/mineflayer/lib/observation/onChat.js diff --git a/metagpt/environment/mincraft_env/mineflayer/lib/observation/onError.js b/metagpt/environment/minecraft/mineflayer/lib/observation/onError.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/lib/observation/onError.js rename to metagpt/environment/minecraft/mineflayer/lib/observation/onError.js diff --git a/metagpt/environment/mincraft_env/mineflayer/lib/observation/onSave.js b/metagpt/environment/minecraft/mineflayer/lib/observation/onSave.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/lib/observation/onSave.js rename to metagpt/environment/minecraft/mineflayer/lib/observation/onSave.js diff --git a/metagpt/environment/mincraft_env/mineflayer/lib/observation/status.js b/metagpt/environment/minecraft/mineflayer/lib/observation/status.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/lib/observation/status.js rename to metagpt/environment/minecraft/mineflayer/lib/observation/status.js diff --git a/metagpt/environment/mincraft_env/mineflayer/lib/observation/voxels.js b/metagpt/environment/minecraft/mineflayer/lib/observation/voxels.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/lib/observation/voxels.js rename to 
metagpt/environment/minecraft/mineflayer/lib/observation/voxels.js diff --git a/metagpt/environment/mincraft_env/mineflayer/lib/skillLoader.js b/metagpt/environment/minecraft/mineflayer/lib/skillLoader.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/lib/skillLoader.js rename to metagpt/environment/minecraft/mineflayer/lib/skillLoader.js diff --git a/metagpt/environment/mincraft_env/mineflayer/lib/utils.js b/metagpt/environment/minecraft/mineflayer/lib/utils.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/lib/utils.js rename to metagpt/environment/minecraft/mineflayer/lib/utils.js diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/.gitignore b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/.gitignore similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/.gitignore rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/.gitignore diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/LICENSE b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/LICENSE similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/LICENSE rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/LICENSE diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/README.md b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/README.md similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/README.md rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/README.md diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/_config.yml b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/_config.yml similarity index 100% rename from 
metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/_config.yml rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/_config.yml diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/docs/api.md b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/docs/api.md similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/docs/api.md rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/docs/api.md diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/examples/collector.js b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/examples/collector.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/examples/collector.js rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/examples/collector.js diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/examples/oreMiner.js b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/examples/oreMiner.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/examples/oreMiner.js rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/examples/oreMiner.js diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/examples/storageBot.js b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/examples/storageBot.js similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/examples/storageBot.js rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/examples/storageBot.js diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/package.json b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/package.json similarity index 100% rename from 
metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/package.json rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/package.json diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/BlockVeins.ts b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/BlockVeins.ts similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/BlockVeins.ts rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/BlockVeins.ts diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/CollectBlock.ts b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/CollectBlock.ts similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/CollectBlock.ts rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/CollectBlock.ts diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/Inventory.ts b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/Inventory.ts similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/Inventory.ts rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/Inventory.ts diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/Targets.ts b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/Targets.ts similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/Targets.ts rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/Targets.ts diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/TaskQueue.ts b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/TaskQueue.ts similarity index 100% rename from 
metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/TaskQueue.ts rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/TaskQueue.ts diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/TemporarySubscriber.ts b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/TemporarySubscriber.ts similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/TemporarySubscriber.ts rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/TemporarySubscriber.ts diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/Util.ts b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/Util.ts similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/Util.ts rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/Util.ts diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/index.ts b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/index.ts similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/src/index.ts rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/src/index.ts diff --git a/metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/tsconfig.json b/metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/tsconfig.json similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/mineflayer-collectblock/tsconfig.json rename to metagpt/environment/minecraft/mineflayer/mineflayer-collectblock/tsconfig.json diff --git a/metagpt/environment/mincraft_env/mineflayer/package.json b/metagpt/environment/minecraft/mineflayer/package.json similarity index 100% rename from metagpt/environment/mincraft_env/mineflayer/package.json rename to 
metagpt/environment/minecraft/mineflayer/package.json diff --git a/metagpt/environment/mincraft_env/process_monitor.py b/metagpt/environment/minecraft/process_monitor.py similarity index 100% rename from metagpt/environment/mincraft_env/process_monitor.py rename to metagpt/environment/minecraft/process_monitor.py diff --git a/metagpt/environment/stanford_town_env/__init__.py b/metagpt/environment/software/__init__.py similarity index 100% rename from metagpt/environment/stanford_town_env/__init__.py rename to metagpt/environment/software/__init__.py diff --git a/metagpt/environment/software_env/software_env.py b/metagpt/environment/software/software_env.py similarity index 100% rename from metagpt/environment/software_env/software_env.py rename to metagpt/environment/software/software_env.py diff --git a/metagpt/environment/werewolf_env/__init__.py b/metagpt/environment/stanford_town/__init__.py similarity index 100% rename from metagpt/environment/werewolf_env/__init__.py rename to metagpt/environment/stanford_town/__init__.py diff --git a/metagpt/environment/stanford_town/env_space.py b/metagpt/environment/stanford_town/env_space.py new file mode 100644 index 000000000..e100a2952 --- /dev/null +++ b/metagpt/environment/stanford_town/env_space.py @@ -0,0 +1,105 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : + +from typing import Any, Optional, Union + +import numpy as np +import numpy.typing as npt +from gymnasium import spaces +from pydantic import ConfigDict, Field, field_validator + +from metagpt.environment.base_env_space import ( + BaseEnvAction, + BaseEnvActionType, + BaseEnvObsParams, + BaseEnvObsType, +) + + +class EnvActionType(BaseEnvActionType): + NONE = 0 # no action to run, just get observation + + ADD_TILE_EVENT = 1 # Add an event triple to a tile + RM_TILE_EVENT = 2 # Remove an event triple from a tile + TURN_TILE_EVENT_IDLE = 3 # Turn an event triple from a tile into idle + RM_TITLE_SUB_EVENT = 4 # Remove an event triple that has the 
input subject from a tile + + +class EnvAction(BaseEnvAction): + """Env action type and the related params of its action function/API""" + + model_config = ConfigDict(arbitrary_types_allowed=True) + + action_type: int = Field(default=EnvActionType.NONE, description="action type") + coord: npt.NDArray[np.int64] = Field( + default_factory=lambda: np.zeros(2, dtype=np.int64), description="tile coordinate" + ) + subject: str = Field(default="", description="subject name of the first element in the event") + event: tuple[str, Optional[str], Optional[str], Optional[str]] = Field( + default=("", None, None, None), description="tile event" + ) + + @field_validator("coord", mode="before") + @classmethod + def check_coord(cls, coord) -> npt.NDArray[np.int64]: + # coerce lists/tuples into an ndarray; pass an ndarray through unchanged + return coord if isinstance(coord, np.ndarray) else np.array(coord) + + +class EnvObsType(BaseEnvObsType): + """get partial observation with specific params""" + + NONE = 0 # get whole observation from env + + GET_TITLE = 1 # get the tile detail dictionary with given tile coord + TILE_PATH = 2 # get the tile address with given tile coord + TILE_NBR = 3 # get the neighbors of given tile coord within its vision radius + + +class EnvObsParams(BaseEnvObsParams): + """observation params for different EnvObsType""" + + model_config = ConfigDict(arbitrary_types_allowed=True) + + obs_type: int = Field(default=EnvObsType.NONE, description="observation type") + coord: npt.NDArray[np.int64] = Field( + default_factory=lambda: np.zeros(2, dtype=np.int64), description="tile coordinate" + ) + level: str = Field(default="", description="address level of the tile") + vision_radius: int = Field(default=0, description="the vision radius of the current tile") + + @field_validator("coord", mode="before") + @classmethod + def check_coord(cls, coord) -> npt.NDArray[np.int64]: + # coerce lists/tuples into an ndarray; pass an ndarray through unchanged + return coord if isinstance(coord, np.ndarray) else np.array(coord) + + +EnvObsValType = Union[list[list[str]], dict[str, set[tuple[int, int]]], list[list[dict[str, Any]]]] + + +def 
get_observation_space() -> spaces.Dict: + # placeholder space: the real observations are nested structures, so Discrete(2) only stands in for each field + space = spaces.Dict( + {"collision_maze": spaces.Discrete(2), "tiles": spaces.Discrete(2), "address_tiles": spaces.Discrete(2)} + ) + + return space + + +def get_action_space(maze_shape: tuple[int, int]) -> spaces.Dict: + """The fields defined by the space correspond to the input parameters of the action except `action_type`""" + space = spaces.Dict( + { + "action_type": spaces.Discrete(len(EnvActionType)), + "coord": spaces.Box( + np.array([0, 0], dtype=np.int64), np.array([maze_shape[0], maze_shape[1]], dtype=np.int64) + ), # coord of the tile + "subject": spaces.Text(256), # the first element of a tile event + "event": spaces.Tuple( + (spaces.Text(256), spaces.Text(256), spaces.Text(256), spaces.Text(256)) + ), # event is a tuple of four strings + } + ) + return space diff --git a/metagpt/environment/stanford_town/stanford_town_env.py b/metagpt/environment/stanford_town/stanford_town_env.py new file mode 100644 index 000000000..af8a882b2 --- /dev/null +++ b/metagpt/environment/stanford_town/stanford_town_env.py @@ -0,0 +1,10 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : MG StanfordTown Env + +from metagpt.environment.base_env import Environment +from metagpt.environment.stanford_town.stanford_town_ext_env import StanfordTownExtEnv + + +class StanfordTownEnv(StanfordTownExtEnv, Environment): + pass diff --git a/metagpt/environment/stanford_town_env/stanford_town_ext_env.py b/metagpt/environment/stanford_town/stanford_town_ext_env.py similarity index 83% rename from metagpt/environment/stanford_town_env/stanford_town_ext_env.py rename to metagpt/environment/stanford_town/stanford_town_ext_env.py index 8a9a65965..30a02d4db 100644 --- a/metagpt/environment/stanford_town_env/stanford_town_ext_env.py +++ b/metagpt/environment/stanford_town/stanford_town_ext_env.py @@ -5,11 +5,20 @@ import math from pathlib import Path -from typing import Optional, Tuple +from typing import Any, Optional from pydantic 
import ConfigDict, Field, model_validator from metagpt.environment.base_env import ExtEnv, mark_as_readable, mark_as_writeable +from metagpt.environment.stanford_town.env_space import ( + EnvAction, + EnvActionType, + EnvObsParams, + EnvObsType, + EnvObsValType, + get_action_space, + get_observation_space, +) from metagpt.utils.common import read_csv_to_list, read_json_file @@ -197,15 +206,82 @@ class StanfordTownExtEnv(ExtEnv): else: address_tiles[add] = set([(j, i)]) values["address_tiles"] = address_tiles + + values["action_space"] = get_action_space((maze_width, maze_height)) + values["observation_space"] = get_observation_space() return values + def reset( + self, + *, + seed: Optional[int] = None, + options: Optional[dict[str, Any]] = None, + ) -> tuple[dict[str, EnvObsValType], dict[str, Any]]: + """reset env and get the init observation + Return results corresponding to `observation, info` + """ + super().reset(seed=seed, options=options) + + obs = self._get_obs() + + return obs, {} + + def _get_obs(self) -> dict[str, EnvObsValType]: + """Get observation""" + return { + "collision_maze": self.get_collision_maze(), + "tiles": self.tiles, + "address_tiles": self.get_address_tiles(), + } + + def observe(self, obs_params: Optional[EnvObsParams] = None) -> Any: + """Get partial or full observation from the env""" + obs_type = obs_params.obs_type if obs_params else EnvObsType.NONE + if obs_type == EnvObsType.NONE: + obs = self._get_obs() + elif obs_type == EnvObsType.GET_TITLE: + obs = self.access_tile(tile=obs_params.coord) + elif obs_type == EnvObsType.TILE_PATH: + obs = self.get_tile_path(tile=obs_params.coord, level=obs_params.level) + elif obs_type == EnvObsType.TILE_NBR: + obs = self.get_nearby_tiles(tile=obs_params.coord, vision_r=obs_params.vision_radius) + return obs + + def step(self, action: EnvAction) -> tuple[dict[str, EnvObsValType], float, bool, bool, dict[str, Any]]: + """Execute action and then return observation + Return results corresponding to 
`observation, reward, terminated, truncated, info` + """ + terminated = False + try: + self._execute_env_action(action) + except Exception: + terminated = True + + obs = self._get_obs() + + ret = (obs, 1.0, terminated, False, {}) + return ret + + def _execute_env_action(self, action: EnvAction): + action_type = action.action_type + if action_type == EnvActionType.NONE: + pass + elif action_type == EnvActionType.ADD_TILE_EVENT: + self.add_event_from_tile(curr_event=action.event, tile=action.coord) + elif action_type == EnvActionType.RM_TILE_EVENT: + self.remove_event_from_tile(curr_event=action.event, tile=action.coord) + elif action_type == EnvActionType.TURN_TILE_EVENT_IDLE: + self.turn_event_from_tile_idle(curr_event=action.event, tile=action.coord) + elif action_type == EnvActionType.RM_TITLE_SUB_EVENT: + self.remove_subject_events_from_tile(subject=action.subject, tile=action.coord) + def turn_coordinate_to_tile(self, px_coordinate: tuple[int, int]) -> tuple[int, int]: """ Turns a pixel coordinate to a tile coordinate. 
""" x = math.ceil(px_coordinate[0] / self.sq_tile_size) y = math.ceil(px_coordinate[1] / self.sq_tile_size) - return (x, y) + return x, y @mark_as_readable def get_collision_maze(self) -> list: @@ -316,10 +392,6 @@ class StanfordTownExtEnv(ExtEnv): nearby_tiles += [(i, j)] return nearby_tiles - @mark_as_writeable - def add_tiles_event(self, pt_y: int, pt_x: int, event: Tuple[str, str, str, str]): - self.tiles[pt_y][pt_x]["events"].add(event) - @mark_as_writeable def add_event_from_tile(self, curr_event: tuple[str], tile: tuple[int, int]) -> None: """ diff --git a/metagpt/environment/stanford_town_env/stanford_town_env.py b/metagpt/environment/stanford_town_env/stanford_town_env.py deleted file mode 100644 index 8721d6cd1..000000000 --- a/metagpt/environment/stanford_town_env/stanford_town_env.py +++ /dev/null @@ -1,12 +0,0 @@ -#!/usr/bin/env python -# -*- coding: utf-8 -*- -# @Desc : MG StanfordTown Env - -from metagpt.environment.base_env import Environment -from metagpt.environment.stanford_town_env.stanford_town_ext_env import ( - StanfordTownExtEnv, -) - - -class StanfordTownEnv(Environment, StanfordTownExtEnv): - pass diff --git a/tests/metagpt/environment/mincraft_env/__init__.py b/metagpt/environment/werewolf/__init__.py similarity index 100% rename from tests/metagpt/environment/mincraft_env/__init__.py rename to metagpt/environment/werewolf/__init__.py diff --git a/metagpt/environment/werewolf_env/werewolf_env.py b/metagpt/environment/werewolf/werewolf_env.py similarity index 93% rename from metagpt/environment/werewolf_env/werewolf_env.py rename to metagpt/environment/werewolf/werewolf_env.py index d174f322c..e22d9c46f 100644 --- a/metagpt/environment/werewolf_env/werewolf_env.py +++ b/metagpt/environment/werewolf/werewolf_env.py @@ -5,7 +5,7 @@ from pydantic import Field from metagpt.environment.base_env import Environment -from metagpt.environment.werewolf_env.werewolf_ext_env import WerewolfExtEnv +from metagpt.environment.werewolf.werewolf_ext_env 
import WerewolfExtEnv from metagpt.logs import logger from metagpt.schema import Message diff --git a/metagpt/environment/werewolf_env/werewolf_ext_env.py b/metagpt/environment/werewolf/werewolf_ext_env.py similarity index 96% rename from metagpt/environment/werewolf_env/werewolf_ext_env.py rename to metagpt/environment/werewolf/werewolf_ext_env.py index 7c4b4c475..3f2508b06 100644 --- a/metagpt/environment/werewolf_env/werewolf_ext_env.py +++ b/metagpt/environment/werewolf/werewolf_ext_env.py @@ -5,11 +5,12 @@ import random from collections import Counter from enum import Enum -from typing import Callable, Optional +from typing import Any, Callable, Optional from pydantic import ConfigDict, Field from metagpt.environment.base_env import ExtEnv, mark_as_readable, mark_as_writeable +from metagpt.environment.base_env_space import BaseEnvAction, BaseEnvObsParams from metagpt.logs import logger @@ -128,6 +129,20 @@ class WerewolfExtEnv(ExtEnv): player_poisoned: Optional[str] = Field(default=None) player_current_dead: list[str] = Field(default=[]) + def reset( + self, + *, + seed: Optional[int] = None, + options: Optional[dict[str, Any]] = None, + ) -> tuple[dict[str, Any], dict[str, Any]]: + pass + + def observe(self, obs_params: Optional[BaseEnvObsParams] = None) -> Any: + pass + + def step(self, action: BaseEnvAction) -> tuple[dict[str, Any], float, bool, bool, dict[str, Any]]: + pass + @property def living_players(self) -> list[str]: player_names = [] diff --git a/metagpt/ext/__init__.py b/metagpt/ext/__init__.py new file mode 100644 index 000000000..2bcf8efd0 --- /dev/null +++ b/metagpt/ext/__init__.py @@ -0,0 +1,3 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : diff --git a/metagpt/ext/stanford_town/README.md b/metagpt/ext/stanford_town/README.md new file mode 100644 index 000000000..bfcb1c818 --- /dev/null +++ b/metagpt/ext/stanford_town/README.md @@ -0,0 +1,36 @@ +## Stanford Town Game + +### Pre-Description +In order to facilitate GA( 
[generative_agents](https://github.com/joonspk-research/generative_agents) )'s frontend consuming the simulation data (and to avoid changing its code), you can set `temp_storage_path` to the `temp_storage` directory of `generative_agents` when starting `run_st_game.py`, like + +`python3 run_st_game.py --temp_storage_path path/to/ga/temp_storage xxx` + +Or change the paths in `const.py` as below + +``` +STORAGE_PATH = EXAMPLE_PATH.joinpath("storage") +TEMP_STORAGE_PATH = EXAMPLE_PATH.joinpath("temp_storage") +# updated +STORAGE_PATH = Path("{path/to/ga/storage}") +TEMP_STORAGE_PATH = Path("{path/to/ga/temp_storage}") +``` + +Either way, the GA frontend can consume the simulation data without changing the GA code; otherwise, the GA code has to be modified to adapt to the MG output path. + +If you don't want to start from scratch, copy one of the simulation directories under `generative_agents/environment/frontend_server/storage/` to `examples/stanford_town/storage`, and choose a directory name as the `fork_sim_code`. + +### Backend service startup +The execution entry is `python3 run_st_game.py "Host a open lunch party at 13:00 pm" "base_the_ville_isabella_maria_klaus" "test_sim" 10` +or +`python3 run_st_game.py "Host a open lunch party at 13:00 pm" "base_the_ville_isabella_maria_klaus" "test_sim" 10 --temp_storage_path path/to/ga/temp_storage` + +`idea` is the user's message to the first agent; it is spread through the agents, and the run shows whether the multi-agent group finally achieves the goal of hosting or joining the event. + +### Frontend service startup +Enter the project folder `generative_agents`. + +Enter `environment/frontend_server` and use `python3 manage.py runserver` to start the frontend service. +Visit `http://localhost:8000/simulator_home` to enter the current simulation interface. + +## Appreciation +This reproduction is based on [generative_agents](https://github.com/joonspk-research/generative_agents); many thanks to the authors of that work. 
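The `--temp_storage_path` override described in the README boils down to an optional CLI flag that, when present, redirects the temp-storage path away from the in-repo default. A minimal sketch of that pattern (the positional-argument names follow the README's command lines; the parser itself is illustrative, not the actual `run_st_game.py`):

```python
import argparse
from pathlib import Path

# in-repo default, mirroring TEMP_STORAGE_PATH in const.py
EXAMPLE_PATH = Path("examples/stanford_town")
DEFAULT_TEMP_STORAGE = EXAMPLE_PATH / "temp_storage"


def resolve_temp_storage(argv: list[str]) -> Path:
    """Parse run_st_game-style arguments and pick the temp_storage path."""
    parser = argparse.ArgumentParser()
    parser.add_argument("idea")            # user's message to the first agent
    parser.add_argument("fork_sim_code")   # simulation directory to fork from
    parser.add_argument("sim_code")        # name of the new simulation
    parser.add_argument("rounds", type=int)
    parser.add_argument("--temp_storage_path", default=None)
    args = parser.parse_args(argv)
    # fall back to the in-repo default when the flag is absent
    return Path(args.temp_storage_path) if args.temp_storage_path else DEFAULT_TEMP_STORAGE
```

With the flag pointed at `generative_agents`' own `temp_storage`, the GA frontend can read the data in place.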
diff --git a/metagpt/ext/stanford_town/README_CN.md b/metagpt/ext/stanford_town/README_CN.md new file mode 100644 index 000000000..c55a742fc --- /dev/null +++ b/metagpt/ext/stanford_town/README_CN.md @@ -0,0 +1,35 @@ +## Stanford Town Game + +### 前置 +为了方便GA( [generative_agents](https://github.com/joonspk-research/generative_agents) )的前端对接数据(避免改动它那块的代码),可在启动`run_st_game.py`加上`temp_storage_path`指向`generative_agents`对应的`temp_storage`路径。比如 + +`python3 run_st_game.py --temp_storage_path path/to/ga/temp_storage xxx` + +或将`const.py`下的 + +``` +STORAGE_PATH = EXAMPLE_PATH.joinpath("storage") +TEMP_STORAGE_PATH = EXAMPLE_PATH.joinpath("temp_storage") +# 更新为 +STORAGE_PATH = Path("{path/to/ga/storage}") +TEMP_STORAGE_PATH = Path("{path/to/ga/temp_storage}") +``` +这样可以在不改变GA代码的情况下实现仿真数据的对接。不然得修改GA的代码来适配MG的输出路径。 + +如果你不想从0开始启动,拷贝`generative_agents/environment/frontend_server/storage/`下的其他仿真目录到`examples/stanford_town/storage`,并选择一个目录名作为`fork_sim_code`。 + +### 后端服务启动 +执行入口为:`python3 run_st_game.py "Host a open lunch party at 13:00 pm" "base_the_ville_isabella_maria_klaus" "test_sim" 10` +或者 +`python3 run_st_game.py "Host a open lunch party at 13:00 pm" "base_the_ville_isabella_maria_klaus" "test_sim" 10 --temp_storage_path path/to/ga/temp_storage` + +`idea`为用户给第一个Agent的用户心声,并通过这个心声进行传播,看最后多智能体是否达到举办、参加活动的目标。 + +### 前端服务启动 +进入`generative_agents`项目目录 + +进入`environment/frontend_server`,使用`python3 manage.py runserver`启动前端服务。 +访问`http://localhost:8000/simulator_home` 进入当前的仿真界面。 + +## Appreciation +This reproduction is based on `https://github.com/joonspk-research/generative_agents`; many thanks to the authors of that work. 
diff --git a/metagpt/ext/stanford_town/__init__.py b/metagpt/ext/stanford_town/__init__.py new file mode 100644 index 000000000..56ea35c9f --- /dev/null +++ b/metagpt/ext/stanford_town/__init__.py @@ -0,0 +1,3 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : stanford town implementation diff --git a/metagpt/ext/stanford_town/actions/__init__.py b/metagpt/ext/stanford_town/actions/__init__.py new file mode 100644 index 000000000..2bcf8efd0 --- /dev/null +++ b/metagpt/ext/stanford_town/actions/__init__.py @@ -0,0 +1,3 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : diff --git a/metagpt/ext/stanford_town/actions/agent_chat_sum_rel.py b/metagpt/ext/stanford_town/actions/agent_chat_sum_rel.py new file mode 100644 index 000000000..98d370bb0 --- /dev/null +++ b/metagpt/ext/stanford_town/actions/agent_chat_sum_rel.py @@ -0,0 +1,39 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : summarize the relationship in an agent chat + +from metagpt.ext.stanford_town.actions.st_action import STAction +from metagpt.logs import logger + + +class AgentChatSumRel(STAction): + name: str = "AgentChatSumRel" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + resp = False + try: + _ = llm_resp.split('"')[0].strip() + resp = True + except Exception: + pass + return resp + + def _func_cleanup(self, llm_resp: str, prompt: str) -> str: + return llm_resp.split('"')[0].strip() + + def _func_fail_default_resp(self) -> str: + pass + + async def run(self, init_role: "STRole", target_role: "STRole", statements: str) -> str: + def create_prompt_input(init_role: "STRole", target_role: "STRole", statements: str) -> list[str]: + prompt_input = [statements, init_role.name, target_role.name] + return prompt_input + + prompt_input = create_prompt_input(init_role, target_role, statements) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "summarize_chat_relationship_v2.txt") + + example_output = "Jane Doe is working on a project" + special_instruction = 
"The output should be a string that responds to the question." + output = await self._run_gpt35(prompt, example_output, special_instruction) + logger.info(f"Role: {init_role.name} Action: {self.cls_name} output: {output}") + return output diff --git a/metagpt/ext/stanford_town/actions/decide_to_talk.py b/metagpt/ext/stanford_town/actions/decide_to_talk.py new file mode 100644 index 000000000..a393f31af --- /dev/null +++ b/metagpt/ext/stanford_town/actions/decide_to_talk.py @@ -0,0 +1,97 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : decide whether to talk to another role; returns yes or no + +from metagpt.ext.stanford_town.actions.st_action import STAction +from metagpt.logs import logger + + +class DecideToTalk(STAction): + name: str = "DecideToTalk" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + resp = False + try: + if llm_resp.split("Answer in yes or no:")[-1].strip().lower() in ["yes", "no"]: + resp = True + except ValueError: + pass + return resp + + def _func_cleanup(self, llm_resp: str, prompt: str) -> str: + return llm_resp.split("Answer in yes or no:")[-1].strip().lower() + + def _func_fail_default_resp(self) -> str: + return "yes" + + async def run(self, init_role: "STRole", target_role: "STRole", retrieved: dict, *args, **kwargs) -> bool: + """Run action""" + + def create_prompt_input(init_role: "STRole", target_role: "STRole", retrieved: dict) -> list[str]: + scratch = init_role.rc.scratch + target_scratch = target_role.rc.scratch + last_chat = init_role.rc.memory.get_last_chat(target_role.name) + last_chatted_time = "" + last_chat_about = "" + if last_chat: + last_chatted_time = last_chat.created.strftime("%B %d, %Y, %H:%M:%S") + last_chat_about = last_chat.description + + context = "" + for c_node in retrieved["events"]: + curr_desc = c_node.description.split(" ") + curr_desc[2:3] = ["was"] + curr_desc = " ".join(curr_desc) + context += f"{curr_desc}. 
" + context += "\n" + for c_node in retrieved["thoughts"]: + context += f"{c_node.description}. " + + curr_time = scratch.curr_time.strftime("%B %d, %Y, %H:%M:%S %p") + init_act_desc = scratch.act_description + if "(" in init_act_desc: + init_act_desc = init_act_desc.split("(")[-1][:-1] + + if len(scratch.planned_path) == 0 and "waiting" not in init_act_desc: + init_p_desc = f"{init_role.name} is already {init_act_desc}" + elif "waiting" in init_act_desc: + init_p_desc = f"{init_role.name} is {init_act_desc}" + else: + init_p_desc = f"{init_role.name} is on the way to {init_act_desc}" + + target_act_desc = target_scratch.act_description + if "(" in target_act_desc: + target_act_desc = target_act_desc.split("(")[-1][:-1] + + if len(target_scratch.planned_path) == 0 and "waiting" not in target_act_desc: + target_p_desc = f"{target_role.name} is already {target_act_desc}" + elif "waiting" in target_act_desc: + target_p_desc = f"{target_role.name} is {target_act_desc}" + else: + target_p_desc = f"{target_role.name} is on the way to {target_act_desc}" + + prompt_input = [] + prompt_input += [context] + + prompt_input += [curr_time] + + prompt_input += [init_role.name] + prompt_input += [target_role.name] + prompt_input += [last_chatted_time] + prompt_input += [last_chat_about] + + prompt_input += [init_p_desc] + prompt_input += [target_p_desc] + prompt_input += [init_role.name] + prompt_input += [target_role.name] + return prompt_input + + prompt_input = create_prompt_input(init_role, target_role, retrieved) + prompt = self.generate_prompt_with_tmpl_filename( + prompt_input=prompt_input, tmpl_filename="decide_to_talk_v2.txt" + ) + self.fail_default_resp = self._func_fail_default_resp() + output = await self._run_gpt35_max_tokens(prompt, max_tokens=20) # yes or no + result = output == "yes" + logger.info(f"Role: {init_role.name} Action: {self.cls_name} output: {result}") + return result diff --git a/metagpt/ext/stanford_town/actions/dummy_action.py 
b/metagpt/ext/stanford_town/actions/dummy_action.py new file mode 100644 index 000000000..a5004d5ef --- /dev/null +++ b/metagpt/ext/stanford_town/actions/dummy_action.py @@ -0,0 +1,20 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : dummy action so that every STRole can handle the DummyMessage produced by DummyAction + +from metagpt.actions import Action +from metagpt.schema import Message + + +class DummyAction(Action): + async def run(self, *args, **kwargs): + raise NotImplementedError + + +class DummyMessage(Message): + """ + dummy message passed to roles so that they execute once every round + """ + + content: str = "dummy" + cause_by: str = "DummyAction" diff --git a/metagpt/ext/stanford_town/actions/gen_action_details.py b/metagpt/ext/stanford_town/actions/gen_action_details.py new file mode 100644 index 000000000..8e268a723 --- /dev/null +++ b/metagpt/ext/stanford_town/actions/gen_action_details.py @@ -0,0 +1,401 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : gen_action_details + +import random + +from metagpt.environment.stanford_town.env_space import EnvObsParams, EnvObsType +from metagpt.ext.stanford_town.actions.st_action import STAction +from metagpt.logs import logger + + +class GenActionSector(STAction): + name: str = "GenActionSector" + + def _func_cleanup(self, llm_resp: str, prompt: str): + cleaned_response = llm_resp.split("}")[0] + return cleaned_response + + def _func_validate(self, llm_resp: str, prompt: str): + if len(llm_resp.strip()) < 1: + return False + if "}" not in llm_resp: + return False + if "," in llm_resp: + return False + return True + + def _func_fail_default_resp(self): + fs = "kitchen" + return fs + + async def run(self, role: "STRole", access_tile: dict[str, str], act_desp: str): + def create_prompt_input(role, access_tile: dict[str, str], act_desp): + act_world = f"{access_tile['world']}" + + prompt_input = [] + + prompt_input += [role.scratch.get_str_name()] + prompt_input += 
[role.scratch.living_area.split(":")[1]] + x = f"{act_world}:{role.scratch.living_area.split(':')[1]}" + prompt_input += [role.s_mem.get_str_accessible_sector_arenas(x)] + + prompt_input += [role.scratch.get_str_name()] + prompt_input += [f"{access_tile['sector']}"] + x = f"{act_world}:{access_tile['sector']}" + prompt_input += [role.s_mem.get_str_accessible_sector_arenas(x)] + + if role.scratch.get_str_daily_plan_req() != "": + prompt_input += [f"\n{role.scratch.get_str_daily_plan_req()}"] + else: + prompt_input += [""] + + # MAR 11 TEMP + prompt_input = [] + act_world = access_tile["world"] + accessible_sector_str = role.s_mem.get_str_accessible_sectors(act_world) + curr = accessible_sector_str.split(", ") + fin_accessible_sectors = [] + for i in curr: + if "'s house" in i: + if role.scratch.last_name in i: + fin_accessible_sectors += [i] + else: + fin_accessible_sectors += [i] + accessible_sector_str = ", ".join(fin_accessible_sectors) + # END MAR 11 TEMP + + prompt_input += [accessible_sector_str] + + act_desp_1 = act_desp + act_desp_2 = act_desp + if "(" in act_desp: + act_desp_1 = act_desp.split("(")[0].strip() + act_desp_2 = act_desp.split("(")[-1][:-1] + prompt_input += [role.scratch.get_str_name()] + prompt_input += [act_desp_1] + + prompt_input += [act_desp_2] + prompt_input += [role.scratch.get_str_name()] + return prompt_input + + prompt_template = "action_location_sector_v1.txt" + prompt_input = create_prompt_input(role, access_tile, act_desp) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, prompt_template) + + self.fail_default_resp = self._func_fail_default_resp() + output = await self._run_gpt35_max_tokens(prompt, max_tokens=15) + y = f"{access_tile['world']}" + x = [i.strip() for i in role.s_mem.get_str_accessible_sectors(y).split(",")] + if output not in x: + # output = random.choice(x) + output = role.scratch.living_area.split(":")[1] + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + 
+class GenActionArena(STAction): + name: str = "GenActionArena" + + def _func_cleanup(self, llm_resp: str, prompt: str): + cleaned_response = llm_resp.split("}")[0] + return cleaned_response + + def _func_validate(self, llm_resp: str, prompt: str): + if len(llm_resp.strip()) < 1: + return False + if "}" not in llm_resp: + return False + if "," in llm_resp: + return False + return True + + def _func_fail_default_resp(self): + fs = "kitchen" + return fs + + async def run(self, role: "STRole", act_desp: str, act_world: str, act_sector: str): + def create_prompt_input(role, act_desp, act_world, act_sector): + prompt_input = [] + prompt_input += [role.scratch.get_str_name()] + x = f"{act_world}:{act_sector}" + prompt_input += [act_sector] + + # MAR 11 TEMP + accessible_arena_str = role.s_mem.get_str_accessible_sector_arenas(x) + curr = accessible_arena_str.split(", ") + fin_accessible_arenas = [] + for i in curr: + if "'s room" in i: + if role.scratch.last_name in i: + fin_accessible_arenas += [i] + else: + fin_accessible_arenas += [i] + accessible_arena_str = ", ".join(fin_accessible_arenas) + # END MAR 11 TEMP + prompt_input += [accessible_arena_str] + act_desp_1 = act_desp + act_desp_2 = act_desp + if "(" in act_desp: + act_desp_1 = act_desp.split("(")[0].strip() + act_desp_2 = act_desp.split("(")[-1][:-1] + prompt_input += [role.scratch.get_str_name()] + prompt_input += [act_desp_1] + + prompt_input += [act_desp_2] + prompt_input += [role.scratch.get_str_name()] + + prompt_input += [act_sector] + prompt_input += [accessible_arena_str] + return prompt_input + + prompt_template = "action_location_object_vMar11.txt" + prompt_input = create_prompt_input(role, act_desp, act_world, act_sector) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, prompt_template) + self.fail_default_resp = self._func_fail_default_resp() + output = await self._run_gpt35_max_tokens(prompt, max_tokens=15) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") 
+ return output + + +class GenActionObject(STAction): + name: str = "GenActionObject" + + def _func_validate(self, llm_resp: str, prompt: str): + if len(llm_resp.strip()) < 1: + return False + return True + + def _func_cleanup(self, llm_resp: str, prompt: str): + cleaned_response = llm_resp.strip() + return cleaned_response + + def _func_fail_default_resp(self): + fs = "bed" + return fs + + async def run(self, role: "STRole", act_desp: str, temp_address: str): + def create_prompt_input(role, act_desp, temp_address): + prompt_input = [] + if "(" in act_desp: + act_desp = act_desp.split("(")[-1][:-1] + + prompt_input += [act_desp] + prompt_input += [role.s_mem.get_str_accessible_arena_game_objects(temp_address)] + return prompt_input + + prompt_template = "action_object_v2.txt" + prompt_input = create_prompt_input(role, act_desp, temp_address) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, prompt_template) + self.fail_default_resp = self._func_fail_default_resp() + output = await self._run_gpt35_max_tokens(prompt, max_tokens=15) + x = [i.strip() for i in role.s_mem.get_str_accessible_arena_game_objects(temp_address).split(",")] + if output not in x: + output = random.choice(x) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +class GenPronunciatio(STAction): + name: str = "GenPronunciatio" + + def _func_cleanup(self, llm_resp: str, prompt: str): + cr = llm_resp.strip() + if len(cr) > 3: + cr = cr[:3] + return cr + + def _func_validate(self, llm_resp: str, prompt: str): + try: + self._func_cleanup(llm_resp, prompt="") + if len(llm_resp) == 0: + return False + except Exception: + return False + return True + + def _func_fail_default_resp(self): + fs = "😋" + return fs + + async def run(self, role: "STRole", act_desp: str): + def create_prompt_input(act_desp): + if "(" in act_desp: + act_desp = act_desp.split("(")[-1].split(")")[0] + prompt_input = [act_desp] + return prompt_input + + prompt_template = 
"generate_pronunciatio_v1.txt" + prompt_input = create_prompt_input(act_desp) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, prompt_template) + example_output = "🛁🧖‍♀️" + special_instruction = "The value for the output must ONLY contain the emojis." + self.fail_default_resp = self._func_fail_default_resp() + output = await self._run_gpt35(prompt, example_output, special_instruction) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +class GenEventTriple(STAction): + name: str = "GenEventTriple" + + def _func_cleanup(self, llm_resp: str, prompt: str): + cr = llm_resp.strip() + cr = [i.strip() for i in cr.split(")")[0].split(",")] + return cr + + def _func_validate(self, llm_resp: str, prompt: str): + try: + llm_resp = self._func_cleanup(llm_resp, prompt="") + if len(llm_resp) != 2: + return False + except Exception: + return False + return True + + def _func_fail_default_resp(self, role): + fs = (role.name, "is", "idle") + return fs + + async def run(self, role: "STRole", act_desp: str): + def create_prompt_input(role, act_desp): + if "(" in act_desp: + act_desp = act_desp.split("(")[-1].split(")")[0] + prompt_input = [role.name, act_desp, role.name] + return prompt_input + + prompt_template = "generate_event_triple_v1.txt" + prompt_input = create_prompt_input(role, act_desp) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, prompt_template) + self.fail_default_resp = self._func_fail_default_resp(role) + output = await self._run_gpt35_max_tokens(prompt, max_tokens=30) + output = (role.name, output[0], output[1]) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +class GenActObjDescription(STAction): + name: str = "GenActObjDescription" + + def _func_cleanup(self, llm_resp: str, prompt: str): + cr = llm_resp.strip() + if cr[-1] == ".": + cr = cr[:-1] + return cr + + def _func_validate(self, llm_resp: str, prompt: str): + try: + llm_resp = 
self._func_cleanup(llm_resp, prompt="") + except Exception: + return False + return True + + def _func_fail_default_resp(self, act_game_object): + fs = f"{act_game_object} is idle" + return fs + + async def run(self, role: "STRole", act_game_object: str, act_desp: str): + def create_prompt_input(act_game_object, act_desp, role): + prompt_input = [act_game_object, role.name, act_desp, act_game_object, act_game_object] + return prompt_input + + prompt_template = "generate_obj_event_v1.txt" + prompt_input = create_prompt_input(act_game_object, act_desp, role) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, prompt_template) + example_output = "being fixed" + special_instruction = "The output should ONLY contain the phrase that should go in ." + self.fail_default_resp = self._func_fail_default_resp(act_game_object) + output = await self._run_gpt35(prompt, example_output, special_instruction) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +class GenObjEventTriple(STAction): + name: str = "GenObjEventTriple" + + def _func_cleanup(self, llm_resp: str, prompt: str): + cr = llm_resp.strip() + cr = [i.strip() for i in cr.split(")")[0].split(",")] + return cr + + def _func_validate(self, llm_resp: str, prompt: str): + try: + llm_resp = self._func_cleanup(llm_resp, prompt="") + if len(llm_resp) != 2: + return False + except Exception: + return False + return True + + def _func_fail_default_resp(self, act_game_object: str): + fs = (act_game_object, "is", "idle") + return fs + + async def run(self, role: "STRole", act_game_object, act_obj_desp): + def create_prompt_input(act_game_object, act_obj_desp): + prompt_input = [act_game_object, act_obj_desp, act_game_object] + return prompt_input + + prompt_template = "generate_event_triple_v1.txt" + prompt_input = create_prompt_input(act_game_object, act_obj_desp) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, prompt_template) + self.fail_default_resp = 
self._func_fail_default_resp(act_game_object) + output = await self._run_gpt35_max_tokens(prompt, max_tokens=30) + output = (act_game_object, output[0], output[1]) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +class GenActionDetails(STAction): + name: str = "GenActionDetails" + + def _func_cleanup(self, llm_resp: str, prompt: str) -> list: + pass + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + # TODO -- this sometimes generates error + try: + self._func_cleanup(llm_resp, prompt) + except Exception: + return False + return True + + def _func_fail_default_resp(self): + fs = {} + return fs + + async def run(self, role: "STRole", act_desp: str, act_dura): + access_tile = role.rc.env.observe( + obs_params=EnvObsParams(obs_type=EnvObsType.GET_TITLE, coord=role.scratch.curr_tile) + ) + act_world = access_tile["world"] + act_sector = await GenActionSector().run(role, access_tile, act_desp) + act_arena = await GenActionArena().run(role, act_desp, act_world, act_sector) + act_address = f"{act_world}:{act_sector}:{act_arena}" + if not role.s_mem.get_str_accessible_arena_game_objects(act_address): + act_game_object = "" + else: + act_game_object = await GenActionObject().run(role, act_desp, act_address) + new_address = f"{act_world}:{act_sector}:{act_arena}:{act_game_object}" + act_pron = await GenPronunciatio().run(role, act_desp) + act_event = await GenEventTriple().run(role, act_desp) + # Persona's actions also influence the object states. We set those up here. 
+ act_obj_desp = await GenActObjDescription().run(role, act_game_object, act_desp) + act_obj_pron = await GenPronunciatio().run(role, act_obj_desp) + act_obj_event = await GenObjEventTriple().run(role, act_game_object, act_obj_desp) + result_dict = { + "action_address": new_address, + "action_duration": int(act_dura), + "action_description": act_desp, + "action_pronunciatio": act_pron, + "action_event": act_event, + "chatting_with": None, + "chat": None, + "chatting_with_buffer": None, + "chatting_end_time": None, + "act_obj_description": act_obj_desp, + "act_obj_pronunciatio": act_obj_pron, + "act_obj_event": act_obj_event, + } + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {result_dict}") + return result_dict diff --git a/metagpt/ext/stanford_town/actions/gen_daily_schedule.py b/metagpt/ext/stanford_town/actions/gen_daily_schedule.py new file mode 100644 index 000000000..5dffa8995 --- /dev/null +++ b/metagpt/ext/stanford_town/actions/gen_daily_schedule.py @@ -0,0 +1,60 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : gen_daily_schedule + + +from metagpt.ext.stanford_town.actions.st_action import STAction +from metagpt.logs import logger + + +class GenDailySchedule(STAction): + name: str = "GenDailySchedule" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + try: + self._func_cleanup(llm_resp, prompt="") + except Exception: + return False + return True + + def _func_cleanup(self, llm_resp: str, prompt: str) -> list: + cr = [] + _cr = llm_resp.split(")") + for i in _cr: + if i[-1].isdigit(): + i = i[:-1].strip() + if i[-1] == "." 
or i[-1] == ",": + cr += [i[:-1].strip()] + return cr + + def _func_fail_default_resp(self) -> int: + fs = [ + "wake up and complete the morning routine at 6:00 am", + "eat breakfast at 7:00 am", + "read a book from 8:00 am to 12:00 pm", + "have lunch at 12:00 pm", + "take a nap from 1:00 pm to 4:00 pm", + "relax and watch TV from 7:00 pm to 8:00 pm", + "go to bed at 11:00 pm", + ] + return fs + + async def run(self, role: "STRole", wake_up_hour: str): + def create_prompt_input(role, wake_up_hour): + prompt_input = [] + prompt_input += [role.scratch.get_str_iss()] + prompt_input += [role.scratch.get_str_lifestyle()] + prompt_input += [role.scratch.get_str_curr_date_str()] + prompt_input += [role.scratch.get_str_firstname()] + prompt_input += [f"{str(wake_up_hour)}:00 am"] + return prompt_input + + wake_up_hour = int(wake_up_hour) + prompt_template = "daily_planning_v6.txt" + prompt_input = create_prompt_input(role, wake_up_hour) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, prompt_template) + self.fail_default_resp = self._func_fail_default_resp() + output = await self._run_gpt35_max_tokens(prompt, max_tokens=500) + output = [f"wake up and complete the morning routine at {wake_up_hour}:00 am"] + output + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output diff --git a/metagpt/ext/stanford_town/actions/gen_hourly_schedule.py b/metagpt/ext/stanford_town/actions/gen_hourly_schedule.py new file mode 100644 index 000000000..5d59f96dd --- /dev/null +++ b/metagpt/ext/stanford_town/actions/gen_hourly_schedule.py @@ -0,0 +1,181 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : gen_hourly_schedule + +import random +import string + +from metagpt.logs import logger + +from .st_action import STAction + + +def get_random_alphanumeric(i=6, j=6): + """ + Returns a random alpha numeric strength that has the length of somewhere + between i and j. 
+ + INPUT: + i: min_range for the length + j: max_range for the length + OUTPUT: + an alpha numeric str with the length of somewhere between i and j. + """ + k = random.randint(i, j) + x = "".join(random.choices(string.ascii_letters + string.digits, k=k)) + return x + + +class GenHourlySchedule(STAction): + name: str = "GenHourlySchedule" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + try: + self._func_cleanup(llm_resp, prompt="") + except Exception: + return False + return True + + def _func_cleanup(self, llm_resp: str, prompt: str) -> str: + cr = llm_resp.strip() + if cr[-1] == ".": + cr = cr[:-1] + # to only use the first line of output + cr = cr.split("\n")[0] + return cr + + def _func_fail_default_resp(self) -> str: + fs = "asleep" + return fs + + async def _generate_schedule_for_given_hour( + self, role: "STRole", curr_hour_str, p_f_ds_hourly_org, hour_str, intermission2=None + ): + def create_prompt_input(persona, curr_hour_str, p_f_ds_hourly_org, hour_str, intermission2=None): + schedule_format = "" + for i in hour_str: + schedule_format += f"[{persona.scratch.get_str_curr_date_str()} -- {i}]" + schedule_format += " Activity: [Fill in]\n" + schedule_format = schedule_format[:-1] + + intermission_str = "Here is the originally intended hourly breakdown of" + intermission_str += f" {persona.scratch.get_str_firstname()}'s schedule today: " + for count, i in enumerate(persona.scratch.daily_req): + intermission_str += f"{str(count + 1)}) {i}, " + intermission_str = intermission_str[:-2] + + prior_schedule = "" + if p_f_ds_hourly_org: + prior_schedule = "\n" + for count, i in enumerate(p_f_ds_hourly_org): + prior_schedule += f"[(ID:{get_random_alphanumeric()})" + prior_schedule += f" {persona.scratch.get_str_curr_date_str()} --" + prior_schedule += f" {hour_str[count]}] Activity:" + prior_schedule += f" {persona.scratch.get_str_firstname()}" + prior_schedule += f" is {i}\n" + + prompt_ending = f"[(ID:{get_random_alphanumeric()})" + prompt_ending 
+= f" {persona.scratch.get_str_curr_date_str()}" + prompt_ending += f" -- {curr_hour_str}] Activity:" + prompt_ending += f" {persona.scratch.get_str_firstname()} is" + + if intermission2: + intermission2 = f"\n{intermission2}" + + prompt_input = [] + prompt_input += [schedule_format] + prompt_input += [persona.scratch.get_str_iss()] + + prompt_input += [prior_schedule + "\n"] + prompt_input += [intermission_str] + if intermission2: + prompt_input += [intermission2] + else: + prompt_input += [""] + prompt_input += [prompt_ending] + + return prompt_input + + prompt_template = "generate_hourly_schedule_v2.txt" + prompt_input = create_prompt_input(role, curr_hour_str, p_f_ds_hourly_org, hour_str, intermission2) + prompt_input_str = "\n".join(prompt_input) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, prompt_template) + self.fail_default_resp = self._func_fail_default_resp() + output = await self._run_gpt35_max_tokens(prompt, max_tokens=50) + logger.info( + f"Role: {role.name} _generate_schedule_for_given_hour prompt_input: {prompt_input_str}, " + f"output: {output}" + ) + return output + + async def run(self, role: "STRole", wake_up_hour: int): + hour_str = [ + "00:00 AM", + "01:00 AM", + "02:00 AM", + "03:00 AM", + "04:00 AM", + "05:00 AM", + "06:00 AM", + "07:00 AM", + "08:00 AM", + "09:00 AM", + "10:00 AM", + "11:00 AM", + "12:00 PM", + "01:00 PM", + "02:00 PM", + "03:00 PM", + "04:00 PM", + "05:00 PM", + "06:00 PM", + "07:00 PM", + "08:00 PM", + "09:00 PM", + "10:00 PM", + "11:00 PM", + ] + n_m1_activity = [] + diversity_repeat_count = 1 # TODO mg 1->3 + for i in range(diversity_repeat_count): + logger.info(f"diversity_repeat_count idx: {i}") + n_m1_activity_set = set(n_m1_activity) + if len(n_m1_activity_set) < 5: + n_m1_activity = [] + for count, curr_hour_str in enumerate(hour_str): + if wake_up_hour > 0: + n_m1_activity += ["sleeping"] + wake_up_hour -= 1 + else: + logger.info(f"_generate_schedule_for_given_hour idx: {count}, n_m1_activity: 
{n_m1_activity}") + n_m1_activity += [ + await self._generate_schedule_for_given_hour(role, curr_hour_str, n_m1_activity, hour_str) + ] + + # Step 1. Compressing the hourly schedule to the following format: + # The integer indicates the number of hours. They should add up to 24. + # [['sleeping', 6], ['waking up and starting her morning routine', 1], + # ['eating breakfast', 1], ['getting ready for the day', 1], + # ['working on her painting', 2], ['taking a break', 1], + # ['having lunch', 1], ['working on her painting', 3], + # ['taking a break', 2], ['working on her painting', 2], + # ['relaxing and watching TV', 1], ['going to bed', 1], ['sleeping', 2]] + _n_m1_hourly_compressed = [] + prev = None + prev_count = 0 + for i in n_m1_activity: + if i != prev: + prev_count = 1 + _n_m1_hourly_compressed += [[i, prev_count]] + prev = i + elif _n_m1_hourly_compressed: + _n_m1_hourly_compressed[-1][1] += 1 + + # Step 2. Expand to min scale (from hour scale) + # [['sleeping', 360], ['waking up and starting her morning routine', 60], + # ['eating breakfast', 60],.. 
+ n_m1_hourly_compressed = [] + for task, duration in _n_m1_hourly_compressed: + n_m1_hourly_compressed += [[task, duration * 60]] + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {n_m1_hourly_compressed}") + return n_m1_hourly_compressed diff --git a/metagpt/ext/stanford_town/actions/gen_iter_chat_utt.py b/metagpt/ext/stanford_town/actions/gen_iter_chat_utt.py new file mode 100644 index 000000000..40f6d3af0 --- /dev/null +++ b/metagpt/ext/stanford_town/actions/gen_iter_chat_utt.py @@ -0,0 +1,125 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : generate_iterative_chat_utt + +from metagpt.environment.stanford_town.env_space import EnvObsParams, EnvObsType +from metagpt.ext.stanford_town.actions.st_action import STAction +from metagpt.ext.stanford_town.utils.utils import extract_first_json_dict +from metagpt.logs import logger + + +class GenIterChatUTT(STAction): + name: str = "GenIterChatUTT" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + resp = False + try: + _ = extract_first_json_dict(llm_resp) + resp = True + except Exception: + pass + return resp + + def _func_cleanup(self, llm_resp: str, prompt: str) -> dict: + gpt_response = extract_first_json_dict(llm_resp) + + cleaned_dict = dict() + cleaned = [] + for key, val in gpt_response.items(): + cleaned += [val] + cleaned_dict["utterance"] = cleaned[0] + cleaned_dict["end"] = True + if "f" in str(cleaned[1]) or "F" in str(cleaned[1]): + cleaned_dict["end"] = False + + return cleaned_dict + + def _func_fail_default_resp(self) -> dict: + cleaned_dict = dict() + cleaned_dict["utterance"] = "..." 
+ cleaned_dict["end"] = False + return cleaned_dict + + async def run( + self, + init_role: "STRole", + target_role: "STRole", + retrieved: dict, + curr_context: str, + curr_chat: list[str], + *args, + **kwargs, + ) -> dict: + def create_prompt_input( + access_tile: dict[str, str], + init_role: "STRole", + target_role: "STRole", + retrieved: dict, + curr_context: str, + curr_chat: list[str], + ): + role = init_role + scratch = role.rc.scratch + target_scratch = target_role.rc.scratch + prev_convo_insert = "\n" + if role.rc.memory.chat_list: + for i in role.rc.memory.chat_list: + if i.object == target_role.name: + v1 = int((scratch.curr_time - i.created).total_seconds() / 60) + prev_convo_insert += ( + f"{str(v1)} minutes ago, {scratch.name} and " + f"{target_scratch.name} were already {i.description} " + f"This context takes place after that conversation." + ) + break + if prev_convo_insert == "\n": + prev_convo_insert = "" + if role.rc.memory.chat_list: + if int((scratch.curr_time - role.rc.memory.chat_list[-1].created).total_seconds() / 60) > 480: + prev_convo_insert = "" + logger.info(f"prev_convo_insert: {prev_convo_insert}") + + curr_sector = f"{access_tile['sector']}" + curr_arena = f"{access_tile['arena']}" + curr_location = f"{curr_arena} in {curr_sector}" + + retrieved_str = "" + for key, vals in retrieved.items(): + for v in vals: + retrieved_str += f"- {v.description}\n" + + convo_str = "" + for i in curr_chat: + convo_str += ": ".join(i) + "\n" + if convo_str == "": + convo_str = "[The conversation has not started yet -- start it!]" + + init_iss = f"Here is Here is a brief description of {scratch.name}.\n{scratch.get_str_iss()}" + prompt_input = [ + init_iss, + scratch.name, + retrieved_str, + prev_convo_insert, + curr_location, + curr_context, + scratch.name, + target_scratch.name, + convo_str, + scratch.name, + target_scratch.name, + scratch.name, + scratch.name, + scratch.name, + ] + return prompt_input + + access_tile = init_role.rc.env.observe( + 
obs_params=EnvObsParams(obs_type=EnvObsType.GET_TITLE, coord=init_role.scratch.curr_tile) + ) + prompt_input = create_prompt_input(access_tile, init_role, target_role, retrieved, curr_context, curr_chat) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "iterative_convo_v1.txt") + # original using `ChatGPT_safe_generate_response_OLD` + self.fail_default_resp = self._func_fail_default_resp() + output = await self._run_gpt35_wo_extra_prompt(prompt) + logger.info(f"Role: {init_role.name} Action: {self.cls_name} output: {output}") + return output diff --git a/metagpt/ext/stanford_town/actions/inner_voice_action.py b/metagpt/ext/stanford_town/actions/inner_voice_action.py new file mode 100644 index 000000000..83cfa037b --- /dev/null +++ b/metagpt/ext/stanford_town/actions/inner_voice_action.py @@ -0,0 +1,35 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : + +from metagpt.ext.stanford_town.actions.st_action import STAction +from metagpt.logs import logger + + +class AgentWhisperThoughtAction(STAction): + name: str = "AgentWhisperThoughtAction" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + try: + self._func_cleanup(llm_resp, prompt) + return True + except Exception: + return False + + def _func_cleanup(self, llm_resp: str, prompt: str = "") -> list: + return llm_resp.split('"')[0].strip() + + def _func_fail_default_resp(self) -> str: + pass + + async def run(self, role: "STRole", statements: str, test_input=None, verbose=False) -> str: + def create_prompt_input(role: "STRole", statements, test_input=None): + prompt_input = [role.scratch.name, statements] + return prompt_input + + prompt_input = create_prompt_input(role, statements) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "whisper_inner_thought_v1.txt") + + output = await self._run_gpt35_max_tokens(prompt, max_tokens=50) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output diff --git 
a/metagpt/ext/stanford_town/actions/new_decomp_schedule.py b/metagpt/ext/stanford_town/actions/new_decomp_schedule.py new file mode 100644 index 000000000..759ec170f --- /dev/null +++ b/metagpt/ext/stanford_town/actions/new_decomp_schedule.py @@ -0,0 +1,154 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : new_decomp_schedule + +import datetime + +from metagpt.ext.stanford_town.actions.st_action import STAction +from metagpt.logs import logger + + +class NewDecompSchedule(STAction): + name: str = "NewDecompSchedule" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + resp = False + try: + llm_resp = self._func_cleanup(llm_resp, prompt) + dur_sum = 0 + for act, dur in llm_resp: + dur_sum += dur + if not isinstance(act, str): + return False + if not isinstance(dur, int): + return False + x = prompt.split("\n")[0].split("originally planned schedule from")[-1].strip()[:-1] + x = [datetime.datetime.strptime(i.strip(), "%H:%M %p") for i in x.split(" to ")] + delta_min = int((x[1] - x[0]).total_seconds() / 60) + + if int(dur_sum) != int(delta_min): + return False + resp = True + except Exception: + pass + return resp + + def _func_cleanup(self, llm_resp: str, prompt: str) -> list: + new_schedule = prompt + " " + llm_resp.strip() + new_schedule = new_schedule.split("The revised schedule:")[-1].strip() + new_schedule = new_schedule.split("\n") + + ret_temp = [] + for i in new_schedule: + ret_temp += [i.split(" -- ")] + + ret = [] + for time_str, action in ret_temp: + start_time = time_str.split(" ~ ")[0].strip() + end_time = time_str.split(" ~ ")[1].strip() + delta = datetime.datetime.strptime(end_time, "%H:%M") - datetime.datetime.strptime(start_time, "%H:%M") + delta_min = int(delta.total_seconds() / 60) + if delta_min < 0: + delta_min = 0 + ret += [[action, delta_min]] + + return ret + + def _func_fail_default_resp(self, main_act_dur: list, truncated_act_dur: list) -> list: + dur_sum = 0 + for act, dur in main_act_dur: + dur_sum += dur + + ret = truncated_act_dur[:] + 
ret += main_act_dur[len(ret) - 1 :] + + # If there is excess, we need to trim... + ret_dur_sum = 0 + count = 0 + over = None + for act, dur in ret: + ret_dur_sum += dur + if ret_dur_sum == dur_sum: + break + if ret_dur_sum > dur_sum: + over = ret_dur_sum - dur_sum + break + count += 1 + + if over: + ret = ret[: count + 1] + ret[-1][1] -= over + + return ret + + async def run( + self, + role: "STRole", + main_act_dur: list, + truncated_act_dur: list, + start_time_hour: datetime.datetime, + end_time_hour: datetime.datetime, + inserted_act: str, + inserted_act_dur: int, + *args, + **kwargs, + ): + def create_prompt_input( + role: "STRole", + main_act_dur: list, + truncated_act_dur: list, + start_time_hour: datetime.datetime, + end_time_hour: datetime.datetime, + inserted_act: str, + inserted_act_dur: int, + ): + persona_name = role.name + start_hour_str = start_time_hour.strftime("%H:%M %p") + end_hour_str = end_time_hour.strftime("%H:%M %p") + + original_plan = "" + for_time = start_time_hour + for i in main_act_dur: + original_plan += ( + f'{for_time.strftime("%H:%M")} ~ ' + f'{(for_time + datetime.timedelta(minutes=int(i[1]))).strftime("%H:%M")} -- ' + i[0] + ) + original_plan += "\n" + for_time += datetime.timedelta(minutes=int(i[1])) + + new_plan_init = "" + for_time = start_time_hour + for count, i in enumerate(truncated_act_dur): + new_plan_init += ( + f'{for_time.strftime("%H:%M")} ~ ' + f'{(for_time + datetime.timedelta(minutes=int(i[1]))).strftime("%H:%M")} -- ' + i[0] + ) + new_plan_init += "\n" + if count < len(truncated_act_dur) - 1: + for_time += datetime.timedelta(minutes=int(i[1])) + + new_plan_init += (for_time + datetime.timedelta(minutes=int(i[1]))).strftime("%H:%M") + " ~" + + prompt_input = [ + persona_name, + start_hour_str, + end_hour_str, + original_plan, + persona_name, + inserted_act, + inserted_act_dur, + persona_name, + start_hour_str, + end_hour_str, + end_hour_str, + new_plan_init, + ] + return prompt_input + + prompt_input = create_prompt_input( + role, main_act_dur, 
truncated_act_dur, start_time_hour, end_time_hour, inserted_act, inserted_act_dur + ) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "new_decomp_schedule_v1.txt") + self.fail_default_resp = self._func_fail_default_resp(main_act_dur, truncated_act_dur) + output = await self._run_gpt35_max_tokens(prompt, max_tokens=1000) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output diff --git a/metagpt/ext/stanford_town/actions/run_reflect_action.py b/metagpt/ext/stanford_town/actions/run_reflect_action.py new file mode 100644 index 000000000..895f6828f --- /dev/null +++ b/metagpt/ext/stanford_town/actions/run_reflect_action.py @@ -0,0 +1,277 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : Integration Reflect Action + +import re + +from metagpt.ext.stanford_town.actions.st_action import STAction +from metagpt.logs import logger + + +# Run GPT Prompt Focal Point method +class AgentFocusPt(STAction): + name: str = "AgentFocusPt" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + try: + self._func_cleanup(llm_resp, prompt) + return True + except Exception: + return False + + def _func_cleanup(self, llm_resp: str, prompt: str = "") -> str: + try: + """ + Cleanup handling has been completed for run_v2 + """ + return llm_resp + except Exception as exp: + logger.error(f"{self.cls_name} with error {exp}") + + def _func_fail_default_resp(self) -> str: + pass + + async def run(self, role: "STRole", statements: str, n: int, test_input=None) -> str: + def create_prompt_input(role: "STRole", statements, n, test_input=None): + prompt_input = [statements, str(n)] + return prompt_input + + prompt_input = create_prompt_input(role, statements, n) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "generate_focal_pt_v1.txt") + + example_output = '["What should Jane do for lunch", "Does Jane like strawberry", "Who is Jane"]' + special_instruction = "Output must be a list of str." 
+ output = await self._run_gpt35(prompt, example_output, special_instruction) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +# Run GPT Prompt Insight and Guidance +class AgentInsightAndGuidance(STAction): + name: str = "AgentInsightAndGuidance" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + try: + self._func_cleanup(llm_resp, prompt) + return True + except Exception: + return False + + def _func_cleanup(self, llm_resp: str, prompt: str = "") -> dict: + try: + llm_resp = "1. " + llm_resp.strip() + ret = dict() + for i in llm_resp.split("\n"): + row = " ".join(i.split(". ")[1:]) + if "(because of " not in row: + continue + thought = row.split("(because of ")[0].strip() + if ")" not in row.split("(because of ")[1]: + continue + evi_raw = row.split("(because of ")[1].split(")")[0].strip() + evi_raw = re.findall(r"\d+", evi_raw) + evi_raw = [int(i.strip()) for i in evi_raw] + ret[thought] = evi_raw + return ret + except Exception as exp: + logger.error(f"{self.cls_name} with error {exp}") + + def _func_fail_default_resp(self, n: int) -> str: + return ["I am hungry"] * n + + async def run(self, role: "STRole", statements: str, n: int, test_input=None) -> dict: + def create_prompt_input(role, statements, n, test_input=None): + prompt_input = [statements, str(n)] + return prompt_input + + prompt_input = create_prompt_input(role, statements, n) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "insight_and_evidence_v1.txt") + + self.fail_default_resp = self._func_fail_default_resp(n) + output = await self._run_gpt35_max_tokens(prompt, max_tokens=150) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +# Run GPT Prompt Event Triple +class AgentEventTriple(STAction): + name: str = "AgentEventTriple" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + try: + llm_resp = self._func_cleanup(llm_resp, prompt="") + if len(llm_resp) != 
2: + return False + except Exception: + return False + return True + + def _func_cleanup(self, llm_resp: str, prompt: str = "") -> list: + try: + cr = llm_resp.strip() + cr = [i.strip() for i in cr.split(")")[0].split(",")] + if len(cr) != 2: + return cr[-2:] + return cr + except Exception as exp: + logger.error(f"{self.cls_name} with error {exp}") + + def _func_fail_default_resp(self) -> str: + pass + + async def run(self, statements: str, role: "STRole", verbose=False) -> tuple: + def create_prompt_input(statements, role): + if "(" in statements: + statements = statements.split("(")[-1].split(")")[0] + prompt_input = [role.scratch.name, statements, role.scratch.name] + return prompt_input + + prompt_input = create_prompt_input(statements, role) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "generate_event_triple_v1.txt") + + output = await self._run_gpt35_max_tokens(prompt, max_tokens=30) + output = (role.scratch.name, output[0], output[1]) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +# Run GPT Prompt Event Poignancy +class AgentEventPoignancy(STAction): + name: str = "AgentEventPoignancy" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + try: + self._func_cleanup(llm_resp, prompt) + return True + except Exception: + return False + + def _func_cleanup(self, llm_resp: str, prompt: str = "") -> int: + try: + llm_resp = int(llm_resp.strip()) + return llm_resp + except Exception as exp: + logger.error(f"{self.cls_name} with error {exp}") + + def _func_fail_default_resp(self) -> str: + pass + + async def run(self, role: "STRole", statements: str, test_input=None, verbose=False) -> str: + def create_prompt_input(role: "STRole", statements: str, test_input=None): + prompt_input = [role.scratch.name, role.scratch.get_str_iss(), role.scratch.name, statements] + return prompt_input + + prompt_input = create_prompt_input(role, statements) + prompt = 
self.generate_prompt_with_tmpl_filename(prompt_input, "poignancy_event_v1.txt") + + example_output = "5" # ######## + special_instruction = "The output should ONLY contain ONE integer value on the scale of 1 to 10." + output = await self._run_gpt35(prompt, example_output, special_instruction) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +# Run GPT Prompt Chat Poignancy +class AgentChatPoignancy(STAction): + name: str = "AgentChatPoignancy" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + try: + self._func_cleanup(llm_resp, prompt) + return True + except Exception: + return False + + def _func_cleanup(self, llm_resp: str, prompt: str = "") -> int: + try: + llm_resp = int(llm_resp.strip()) + return llm_resp + except Exception as exp: + logger.error(f"{self.cls_name} with error {exp}") + + def _func_fail_default_resp(self) -> str: + pass + + async def run(self, role: "STRole", statements: str, test_input=None, verbose=False) -> str: + def create_prompt_input(role: "STRole", statements, test_input=None): + prompt_input = [role.scratch.name, role.scratch.get_str_iss(), role.scratch.name, statements] + return prompt_input + + prompt_input = create_prompt_input(role, statements) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "poignancy_chat_v1.txt") + + example_output = "5" # ######## + special_instruction = "The output should ONLY contain ONE integer value on the scale of 1 to 10." 
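The poignancy actions expect a bare integer on a 1-10 scale back from the model; `_func_cleanup` simply calls `int(llm_resp.strip())` and `_func_validate` checks only that the conversion succeeds. A hedged standalone sketch of that parsing, where the range check and the fallback value are assumptions added for illustration (the original has no explicit clamp):

```python
def parse_poignancy(llm_resp: str, default: int = 4) -> int:
    # Mirrors AgentEventPoignancy._func_cleanup: the reply must be a bare
    # integer; the 1-10 range check and `default` fallback are assumptions.
    try:
        score = int(llm_resp.strip())
    except (ValueError, TypeError):
        return default
    return score if 1 <= score <= 10 else default
```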
+ output = await self._run_gpt35(prompt, example_output, special_instruction) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +# Run GPT Prompt Planning Thought on Convo +class AgentPlanThoughtOnConvo(STAction): + name: str = "AgentPlanThoughtOnConvo" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + try: + self._func_cleanup(llm_resp, prompt) + return True + except Exception: + return False + + def _func_cleanup(self, llm_resp: str, prompt: str = "") -> str: + try: + return llm_resp.split('"')[0].strip() + except Exception as exp: + logger.error(f"{self.cls_name} with error {exp}") + + def _func_fail_default_resp(self) -> str: + pass + + async def run(self, role: "STRole", statements: str, test_input=None, verbose=False) -> str: + def create_prompt_input(role, statements, test_input=None): + prompt_input = [statements, role.scratch.name, role.scratch.name, role.scratch.name] + return prompt_input + + prompt_input = create_prompt_input(role, statements) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "planning_thought_on_convo_v1.txt") + + output = await self._run_gpt35_max_tokens(prompt, max_tokens=50) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output + + +# Run GPT Prompt Memory on Convo +class AgentMemoryOnConvo(STAction): + name: str = "AgentMemoryOnConvo" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + try: + self._func_cleanup(llm_resp, prompt) + return True + except Exception: + return False + + def _func_cleanup(self, llm_resp: str, prompt: str = "") -> str: + try: + return llm_resp.split('"')[0].strip() + except Exception as exp: + logger.error(f"{self.cls_name} with error {exp}") + + def _func_fail_default_resp(self) -> str: + pass + + async def run(self, role: "STRole", statements: str, test_input=None, verbose=False) -> str: + def create_prompt_input(role, statements, test_input=None): + prompt_input = 
[statements, role.scratch.name, role.scratch.name, role.scratch.name] + return prompt_input + + prompt_input = create_prompt_input(role, statements) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "memo_on_convo_v1.txt") + example_output = "Jane Doe was interesting to talk to." + special_instruction = ( + "The output should ONLY contain a string that summarizes anything interesting " + "that the agent may have noticed" + ) + output = await self._run_gpt35(prompt, example_output, special_instruction) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output diff --git a/metagpt/ext/stanford_town/actions/st_action.py b/metagpt/ext/stanford_town/actions/st_action.py new file mode 100644 index 000000000..321676374 --- /dev/null +++ b/metagpt/ext/stanford_town/actions/st_action.py @@ -0,0 +1,119 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : StanfordTown Action +import json +import time +from abc import abstractmethod +from pathlib import Path +from typing import Any, Optional, Union + +from metagpt.actions.action import Action +from metagpt.config2 import config +from metagpt.ext.stanford_town.utils.const import PROMPTS_DIR +from metagpt.logs import logger + + +class STAction(Action): + name: str = "STAction" + prompt_dir: Path = PROMPTS_DIR + fail_default_resp: Optional[str] = None + + @property + def cls_name(self): + return self.__class__.__name__ + + @abstractmethod + def _func_validate(self, llm_resp: str, prompt: str): + raise NotImplementedError + + @abstractmethod + def _func_cleanup(self, llm_resp: str, prompt: str): + raise NotImplementedError + + @abstractmethod + def _func_fail_default_resp(self): + raise NotImplementedError + + def generate_prompt_with_tmpl_filename(self, prompt_input: Union[str, list], tmpl_filename) -> str: + """ + same with `generate_prompt` + Args: + prompt_input: the input we want to feed in (IF THERE ARE MORE THAN ONE INPUT, THIS CAN BE A LIST.) 
+ tmpl_filename: prompt template filename + Returns: + a str prompt that will be sent to LLM server. + """ + if isinstance(prompt_input, str): + prompt_input = [prompt_input] + prompt_input = [str(i) for i in prompt_input] + + with open(str(self.prompt_dir.joinpath(tmpl_filename)), "r") as f: + prompt = f.read() + for count, i in enumerate(prompt_input): + prompt = prompt.replace(f"!<INPUT {count}>!", i) + if "###" in prompt: + prompt = prompt.split("###")[1] + return prompt.strip() + + async def _aask(self, prompt: str) -> str: + return await self.llm.aask(prompt) + + async def _run_gpt35_max_tokens(self, prompt: str, max_tokens: int = 50, retry: int = 3): + for idx in range(retry): + try: + tmp_max_tokens_rsp = getattr(config.llm, "max_token", 1500) + setattr(config.llm, "max_token", max_tokens) + self.llm.use_system_prompt = False # make it behave like a non-chat completion endpoint + + llm_resp = await self._aask(prompt) + + setattr(config.llm, "max_token", tmp_max_tokens_rsp) + logger.info(f"Action: {self.cls_name} llm _run_gpt35_max_tokens raw resp: {llm_resp}") + if self._func_validate(llm_resp, prompt): + return self._func_cleanup(llm_resp, prompt) + except Exception as exp: + logger.warning(f"Action: {self.cls_name} _run_gpt35_max_tokens exp: {exp}") + time.sleep(5) + return self.fail_default_resp + + async def _run_gpt35( + self, prompt: str, example_output: str, special_instruction: str, retry: int = 3 + ) -> Union[bool, Any]: + """same as `gpt_structure.ChatGPT_safe_generate_response`""" + prompt = '"""\n' + prompt + '\n"""\n' + prompt += f"Output the response to the prompt above in json. 
{special_instruction}\n" + prompt += "Example output json:\n" + prompt += '{"output": "' + str(example_output) + '"}' + + for idx in range(retry): + try: + llm_resp = await self._aask(prompt) + logger.info(f"Action: {self.cls_name} llm _run_gpt35 raw resp: {llm_resp}") + end_idx = llm_resp.strip().rfind("}") + 1 + llm_resp = llm_resp[:end_idx] + llm_resp = json.loads(llm_resp)["output"] + + if self._func_validate(llm_resp, prompt): + return self._func_cleanup(llm_resp, prompt) + except Exception as exp: + logger.warning(f"Action: {self.cls_name} _run_gpt35 exp: {exp}") + time.sleep(5) # usually avoid `Rate limit` + return False + + async def _run_gpt35_wo_extra_prompt(self, prompt: str, retry: int = 3) -> str: + for idx in range(retry): + try: + llm_resp = await self._aask(prompt) + llm_resp = llm_resp.strip() + logger.info(f"Action: {self.cls_name} llm _run_gpt35_wo_extra_prompt raw resp: {llm_resp}") + if self._func_validate(llm_resp, prompt): + return self._func_cleanup(llm_resp, prompt) + except Exception as exp: + logger.warning(f"Action: {self.cls_name} _run_gpt35_wo_extra_prompt exp: {exp}") + time.sleep(5) # usually avoid `Rate limit` + return self.fail_default_resp + + async def run(self, *args, **kwargs): + """Run action""" + raise NotImplementedError("The run method should be implemented in a subclass.") diff --git a/metagpt/ext/stanford_town/actions/summarize_conv.py b/metagpt/ext/stanford_town/actions/summarize_conv.py new file mode 100644 index 000000000..5be5fcaa4 --- /dev/null +++ b/metagpt/ext/stanford_town/actions/summarize_conv.py @@ -0,0 +1,47 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : summarize the content of agents' conversation + +from metagpt.ext.stanford_town.actions.st_action import STAction +from metagpt.logs import logger + + +class SummarizeConv(STAction): + name: str = "SummarizeConv" + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + resp = False + try: + _ = self._func_cleanup(llm_resp, prompt) + 
resp = True + except Exception: + pass + return resp + + def _func_cleanup(self, llm_resp: str, prompt: str) -> str: + ret = "conversing about " + llm_resp.strip() + return ret + + def _func_fail_default_resp(self) -> str: + return "conversing with a housemate about morning greetings" + + async def run(self, conv: list): + def create_prompt_input(conversation: list): + convo_str = "" + for row in conversation: + convo_str += f'{row[0]}: "{row[1]}"\n' + prompt_input = [convo_str] + return prompt_input + + prompt_input = create_prompt_input(conv) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "summarize_conversation_v1.txt") + + example_output = "conversing about what to eat for lunch" + special_instruction = ( + "The output must continue the sentence above by filling in the <fill in> tag. " + "Don't start with 'this is a conversation about...' Just finish the sentence " + "but do not miss any important details (including who is chatting)." + ) + output = await self._run_gpt35(prompt, example_output, special_instruction) + logger.info(f"Action: {self.cls_name} output: {output}") + return output diff --git a/metagpt/ext/stanford_town/actions/task_decomp.py b/metagpt/ext/stanford_town/actions/task_decomp.py new file mode 100644 index 000000000..3a23a7345 --- /dev/null +++ b/metagpt/ext/stanford_town/actions/task_decomp.py @@ -0,0 +1,173 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : task_decomp + +import datetime + +from metagpt.ext.stanford_town.actions.st_action import STAction +from metagpt.logs import logger + + +class TaskDecomp(STAction): + name: str = "TaskDecomp" + + def _func_cleanup(self, llm_resp: str, prompt: str) -> list: + # TODO SOMETHING HERE sometimes fails... 
See screenshot + temp = [i.strip() for i in llm_resp.split("\n")] + _cr = [] + cr = [] + for count, i in enumerate(temp): + if count != 0: + _cr += [" ".join([j.strip() for j in i.split(" ")][3:])] + else: + _cr += [i] + for count, i in enumerate(_cr): + k = [j.strip() for j in i.split("(duration in minutes:")] + task = k[0] + if task[-1] == ".": + task = task[:-1] + duration = int(k[1].split(",")[0].strip()) + cr += [[task, duration]] + + total_expected_min = int(prompt.split("(total duration in minutes")[-1].split("):")[0].strip()) + + # TODO -- now, you need to make sure that this is the same as the sum of + # the current action sequence. + curr_min_slot = [ + ["dummy", -1], + ] # (task_name, task_index) + for count, i in enumerate(cr): + i_task = i[0] + i_duration = i[1] + + i_duration -= i_duration % 5 + if i_duration > 0: + for j in range(i_duration): + curr_min_slot += [(i_task, count)] + curr_min_slot = curr_min_slot[1:] + + if len(curr_min_slot) > total_expected_min: + last_task = curr_min_slot[60] + for i in range(1, 6): + curr_min_slot[-1 * i] = last_task + elif len(curr_min_slot) < total_expected_min: + last_task = curr_min_slot[-1] + for i in range(total_expected_min - len(curr_min_slot)): + curr_min_slot += [last_task] + + cr_ret = [ + ["dummy", -1], + ] + for task, task_index in curr_min_slot: + if task != cr_ret[-1][0]: + cr_ret += [[task, 1]] + else: + cr_ret[-1][1] += 1 + cr = cr_ret[1:] + + return cr + + def _func_validate(self, llm_resp: str, prompt: str) -> bool: + # TODO -- this sometimes generates error + try: + self._func_cleanup(llm_resp, prompt) + except Exception: + return False + return True + + def _func_fail_default_resp(self) -> int: + fs = [["asleep", 0]] + return fs + + async def run(self, role: "STRole", task_desc: int, truncated_act_dur: int, *args, **kwargs): + def create_prompt_input(role, task, duration): + """ + Today is Saturday June 25. 
From 00:00 ~ 06:00am, Maeve is + planning on sleeping, 06:00 ~ 07:00am, Maeve is + planning on waking up and doing her morning routine, + and from 07:00am ~08:00am, Maeve is planning on having breakfast. + """ + + curr_f_org_index = role.scratch.get_f_daily_schedule_hourly_org_index() + all_indices = [] + # if curr_f_org_index > 0: + # all_indices += [curr_f_org_index-1] + all_indices += [curr_f_org_index] + if curr_f_org_index + 1 <= len(role.scratch.f_daily_schedule_hourly_org): + all_indices += [curr_f_org_index + 1] + if curr_f_org_index + 2 <= len(role.scratch.f_daily_schedule_hourly_org): + all_indices += [curr_f_org_index + 2] + + curr_time_range = "" + + logger.debug("DEBUG") + logger.debug(role.scratch.f_daily_schedule_hourly_org) + logger.debug(all_indices) + + summ_str = f'Today is {role.scratch.curr_time.strftime("%B %d, %Y")}. ' + summ_str += "From " + for index in all_indices: + logger.debug(f"index {index}") + if index < len(role.scratch.f_daily_schedule_hourly_org): + start_min = 0 + for i in range(index): + start_min += role.scratch.f_daily_schedule_hourly_org[i][1] + end_min = start_min + role.scratch.f_daily_schedule_hourly_org[index][1] + start_time = datetime.datetime.strptime("00:00:00", "%H:%M:%S") + datetime.timedelta( + minutes=start_min + ) + end_time = datetime.datetime.strptime("00:00:00", "%H:%M:%S") + datetime.timedelta( + minutes=end_min + ) + start_time_str = start_time.strftime("%H:%M%p") + end_time_str = end_time.strftime("%H:%M%p") + summ_str += ( + f"{start_time_str} ~ {end_time_str}, {role.name} is planning " + f"on {role.scratch.f_daily_schedule_hourly_org[index][0]}, " + ) + if curr_f_org_index + 1 == index: + curr_time_range = f"{start_time_str} ~ {end_time_str}" + summ_str = summ_str[:-2] + "." 
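`_func_cleanup` above normalizes the decomposed subtasks by rounding each duration down to a 5-minute multiple, expanding the schedule into per-minute slots, and padding or trimming to the expected total before collapsing back into (task, duration) pairs. A simplified sketch of that idea (the real code derives the expected total from the prompt text and patches the last five slots rather than doing a plain trim):

```python
def normalize_durations(tasks, total_expected_min):
    # Round each duration down to a multiple of 5 and expand into
    # per-minute slots tagged with the task index.
    slots = []
    for idx, (task, dur) in enumerate(tasks):
        dur -= dur % 5
        slots += [(task, idx)] * dur
    # Pad with the final task, or trim, so the schedule matches the total.
    if len(slots) < total_expected_min:
        slots += [slots[-1]] * (total_expected_min - len(slots))
    else:
        slots = slots[:total_expected_min]
    # Collapse consecutive slots back into [task, duration] pairs.
    ret = []
    for task, _ in slots:
        if ret and ret[-1][0] == task:
            ret[-1][1] += 1
        else:
            ret.append([task, 1])
    return ret
```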
+ + prompt_input = [] + prompt_input += [role.scratch.get_str_iss()] + prompt_input += [summ_str] + # prompt_input += [role.scratch.get_str_curr_date_str()] + prompt_input += [role.scratch.get_str_firstname()] + prompt_input += [role.scratch.get_str_firstname()] + prompt_input += [task] + prompt_input += [curr_time_range] + prompt_input += [duration] + prompt_input += [role.scratch.get_str_firstname()] + return prompt_input + + prompt_input = create_prompt_input(role, task_desc, truncated_act_dur) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "task_decomp_v3.txt") + self.fail_default_resp = self._func_fail_default_resp() + output = await self._run_gpt35_max_tokens(prompt, max_tokens=1000) + logger.info(f"Role: {role.name} {self.cls_name} output: {output}") + + fin_output = [] + time_sum = 0 + for i_task, i_duration in output: + time_sum += i_duration + # HM????????? + # if time_sum < duration: + if time_sum <= truncated_act_dur: + fin_output += [[i_task, i_duration]] + else: + break + ftime_sum = 0 + for fi_task, fi_duration in fin_output: + ftime_sum += fi_duration + + fin_output[-1][1] += truncated_act_dur - ftime_sum + output = fin_output + + task_decomp = output + ret = [] + for decomp_task, duration in task_decomp: + ret += [[f"{task_desc} ({decomp_task})", duration]] + output = ret + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output diff --git a/metagpt/ext/stanford_town/actions/wake_up.py b/metagpt/ext/stanford_town/actions/wake_up.py new file mode 100644 index 000000000..ea44cd3a4 --- /dev/null +++ b/metagpt/ext/stanford_town/actions/wake_up.py @@ -0,0 +1,42 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : wake_up + + +from metagpt.ext.stanford_town.actions.st_action import STAction +from metagpt.logs import logger + + +class WakeUp(STAction): + name: str = "WakeUp" + + def _func_validate(self, llm_resp: str, prompt: str = None) -> bool: + try: + self._func_cleanup(llm_resp, prompt="") 
+ except Exception: + return False + return True + + def _func_cleanup(self, llm_resp: str, prompt: str) -> int: + cr = int(llm_resp.strip().lower().split("am")[0]) + return cr + + def _func_fail_default_resp(self) -> int: + fs = 8 + return fs + + async def run(self, role: "STRole"): + def create_prompt_input(role): + prompt_input = [ + role.scratch.get_str_iss(), + role.scratch.get_str_lifestyle(), + role.scratch.get_str_firstname(), + ] + return prompt_input + + prompt_input = create_prompt_input(role) + prompt = self.generate_prompt_with_tmpl_filename(prompt_input, "wake_up_hour_v1.txt") + self.fail_default_resp = self._func_fail_default_resp() + output = await self._run_gpt35_max_tokens(prompt, max_tokens=5) + logger.info(f"Role: {role.name} Action: {self.cls_name} output: {output}") + return output diff --git a/metagpt/ext/stanford_town/memory/__init__.py b/metagpt/ext/stanford_town/memory/__init__.py new file mode 100644 index 000000000..e69de29bb diff --git a/metagpt/ext/stanford_town/memory/agent_memory.py b/metagpt/ext/stanford_town/memory/agent_memory.py new file mode 100644 index 000000000..d212232f4 --- /dev/null +++ b/metagpt/ext/stanford_town/memory/agent_memory.py @@ -0,0 +1,378 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : BasicMemory and AgentMemory implementations + +from datetime import datetime +from pathlib import Path +from typing import Optional + +from pydantic import Field, field_serializer, model_validator + +from metagpt.logs import logger +from metagpt.memory.memory import Memory +from metagpt.schema import Message +from metagpt.utils.common import read_json_file, write_json_file + + +class BasicMemory(Message): + """ + BasicMemory inherits from MetaGPT's Message class, with the content attribute standing in for description. + Message supports the Chat type well, but offers little support for an agent's Perceive, Reflection and Plan. + In the type design we keep GA's three kinds, with special handling for Chat-type conversations (the exact design is still undecided). + """ + + memory_id: Optional[str] = Field(default=None) # memory ID + memory_count: int = -1 # index of this memory; equal to the overall Memory count + type_count: int = -1 # index within its memory type (int) + 
memory_type: Optional[str] = Field(default=None) # memory type: one of event, thought, chat + depth: int = -1 # memory depth (int) + created: Optional[datetime] = Field(default=None) # creation time + expiration: Optional[datetime] = Field(default=None) # expiration time; None by default + last_accessed: Optional[datetime] = Field(default=None) # last access time; initialized to self.created + subject: Optional[str] = Field(default=None) # subject + predicate: Optional[str] = Field(default=None) # predicate + object: Optional[str] = Field(default=None) # object + + description: Optional[str] = Field(default=None) + embedding_key: Optional[str] = Field(default=None) # same as self.content + poignancy: int = -1 # importance score + keywords: list[str] = Field(default=[]) # keywords + filling: list = Field(default=[]) # list of associated memory_ids + + __hash__ = object.__hash__ # support hash in AgentMemory + + @model_validator(mode="before") + @classmethod + def check_values(cls, values): + if "created" in values: + values["last_accessed"] = values["created"] + if "content" in values: + values["description"] = values["content"] + if "filling" in values: + values["filling"] = values["filling"] or [] + return values + + @field_serializer("created", "expiration") + def transform_time_field(self, time_field: Optional[datetime]) -> str: + if time_field: + time_field = time_field.strftime("%Y-%m-%d %H:%M:%S") + return time_field + + def summary(self): + return self.subject, self.predicate, self.object + + def save_to_dict(self) -> dict: + """ + Convert this BasicMemory into a dict for JSON storage. + Note that cause_by is not compatible with GA, so a format conversion is required. + """ + memory_dict = dict() + node_id = self.memory_id + basic_mem_obj = self.model_dump( + include=[ + "node_count", + "type_count", + "type", + "depth", + "created", + "expiration", + "subject", + "predicate", + "object", + "description", + "embedding_key", + "poignancy", + "keywords", + "filling", + "cause_by", + ] + ) + + memory_dict[node_id] = basic_mem_obj + return memory_dict + + +class AgentMemory(Memory): + """ + GA mainly persists three kinds of JSON: + 1. 
embedding.json (Dict embedding_key:embedding) + 2. Node.json (Dict Node_id:Node) + 3. kw_strength.json + """ + + storage: list[BasicMemory] = [] # overrides storage; holds all BasicMemory nodes + event_list: list[BasicMemory] = [] # event memories + thought_list: list[BasicMemory] = [] # thought memories + chat_list: list[BasicMemory] = [] # chat-related memory + + event_keywords: dict[str, list[BasicMemory]] = dict() # keyword index + thought_keywords: dict[str, list[BasicMemory]] = dict() + chat_keywords: dict[str, list[BasicMemory]] = dict() + + kw_strength_event: dict[str, int] = dict() + kw_strength_thought: dict[str, int] = dict() + + memory_saved: Optional[Path] = Field(default=None) + embeddings: dict[str, list[float]] = dict() + + def set_mem_path(self, memory_saved: Path): + self.memory_saved = memory_saved + self.load(memory_saved) + + def save(self, memory_saved: Path): + """ + Persist BasicMemory nodes in GA's nodes.json format and reproduce GA's kw_strength.json format; + just supply a target path. + TODO nodes are stored in reverse order here; this still needs verification (test_memory passes) + """ + memory_json = dict() + for i in range(len(self.storage)): + memory_node = self.storage[len(self.storage) - i - 1] + memory_node = memory_node.save_to_dict() + memory_json.update(memory_node) + write_json_file(memory_saved.joinpath("nodes.json"), memory_json) + write_json_file(memory_saved.joinpath("embeddings.json"), self.embeddings) + + strength_json = dict() + strength_json["kw_strength_event"] = self.kw_strength_event + strength_json["kw_strength_thought"] = self.kw_strength_thought + write_json_file(memory_saved.joinpath("kw_strength.json"), strength_json) + + def load(self, memory_saved: Path): + """ + Parse GA's JSON files and populate this AgentMemory. + """ + self.embeddings = read_json_file(memory_saved.joinpath("embeddings.json")) + memory_load = read_json_file(memory_saved.joinpath("nodes.json")) + for count in range(len(memory_load.keys())): + node_id = f"node_{str(count + 1)}" + node_details = memory_load[node_id] + node_type = node_details["type"] + created = datetime.strptime(node_details["created"], 
"%Y-%m-%d %H:%M:%S") + expiration = None + if node_details["expiration"]: + expiration = datetime.strptime(node_details["expiration"], "%Y-%m-%d %H:%M:%S") + + s = node_details["subject"] + p = node_details["predicate"] + o = node_details["object"] + + description = node_details["description"] + embedding_pair = (node_details["embedding_key"], self.embeddings[node_details["embedding_key"]]) + poignancy = node_details["poignancy"] + keywords = set(node_details["keywords"]) + filling = node_details["filling"] + if node_type == "thought": + self.add_thought( + created, expiration, s, p, o, description, keywords, poignancy, embedding_pair, filling + ) + if node_type == "event": + self.add_event(created, expiration, s, p, o, description, keywords, poignancy, embedding_pair, filling) + if node_type == "chat": + self.add_chat(created, expiration, s, p, o, description, keywords, poignancy, embedding_pair, filling) + + strength_keywords_load = read_json_file(memory_saved.joinpath("kw_strength.json")) + if strength_keywords_load["kw_strength_event"]: + self.kw_strength_event = strength_keywords_load["kw_strength_event"] + if strength_keywords_load["kw_strength_thought"]: + self.kw_strength_thought = strength_keywords_load["kw_strength_thought"] + + def add(self, memory_basic: BasicMemory): + """ + Add a new message to storage, while updating the index. + Overrides Memory.add: stores BasicMemory instead of Message and dispatches on the memory type. + """ + if memory_basic.memory_id in [mem.memory_id for mem in self.storage]: + return + self.storage.append(memory_basic) + if memory_basic.memory_type == "chat": + self.chat_list[0:0] = [memory_basic] + return + if memory_basic.memory_type == "thought": + self.thought_list[0:0] = [memory_basic] + return + if memory_basic.memory_type == "event": + self.event_list[0:0] = [memory_basic] + return + + def add_chat( + self, created, expiration, s, p, o, content, keywords, poignancy, embedding_pair, filling, cause_by="" + ): + """ + Initialize a chat memory and add it; the embedding must be computed at creation time. + """ + memory_count = 
len(self.storage) + 1 + type_count = len(self.chat_list) + 1 + memory_type = "chat" + memory_id = f"node_{str(memory_count)}" + depth = 1 + + memory_node = BasicMemory( + memory_id=memory_id, + memory_count=memory_count, + type_count=type_count, + memory_type=memory_type, + depth=depth, + created=created, + expiration=expiration, + subject=s, + predicate=p, + object=o, + description=content, + embedding_key=embedding_pair[0], + poignancy=poignancy, + keywords=keywords, + filling=filling, + cause_by=cause_by, + ) + + keywords = [i.lower() for i in keywords] + for kw in keywords: + if kw in self.chat_keywords: + self.chat_keywords[kw][0:0] = [memory_node] + else: + self.chat_keywords[kw] = [memory_node] + + self.add(memory_node) + + self.embeddings[embedding_pair[0]] = embedding_pair[1] + return memory_node + + def add_thought(self, created, expiration, s, p, o, content, keywords, poignancy, embedding_pair, filling): + """ + Initialize a thought memory and add it. + """ + memory_count = len(self.storage) + 1 + type_count = len(self.thought_list) + 1 + memory_type = "thought" + memory_id = f"node_{str(memory_count)}" + depth = 1 + + try: + if filling: + depth_list = [memory_node.depth for memory_node in self.storage if memory_node.memory_id in filling] + depth += max(depth_list) + except Exception as exp: + logger.warning(f"filling init occurred {exp}") + pass + + memory_node = BasicMemory( + memory_id=memory_id, + memory_count=memory_count, + type_count=type_count, + memory_type=memory_type, + depth=depth, + created=created, + expiration=expiration, + subject=s, + predicate=p, + object=o, + description=content, + embedding_key=embedding_pair[0], + poignancy=poignancy, + keywords=keywords, + filling=filling, + ) + + keywords = [i.lower() for i in keywords] + for kw in keywords: + if kw in self.thought_keywords: + self.thought_keywords[kw][0:0] = [memory_node] + else: + self.thought_keywords[kw] = [memory_node] + + self.add(memory_node) + + if f"{p} {o}" != "is idle": + for kw in keywords: 
+ if kw in self.kw_strength_thought: + self.kw_strength_thought[kw] += 1 + else: + self.kw_strength_thought[kw] = 1 + + self.embeddings[embedding_pair[0]] = embedding_pair[1] + return memory_node + + def add_event(self, created, expiration, s, p, o, content, keywords, poignancy, embedding_pair, filling): + """ + Initialize an event memory and add it. + """ + memory_count = len(self.storage) + 1 + type_count = len(self.event_list) + 1 + memory_type = "event" + memory_id = f"node_{str(memory_count)}" + depth = 0 + + if "(" in content: + content = " ".join(content.split()[:3]) + " " + content.split("(")[-1][:-1] + + memory_node = BasicMemory( + memory_id=memory_id, + memory_count=memory_count, + type_count=type_count, + memory_type=memory_type, + depth=depth, + created=created, + expiration=expiration, + subject=s, + predicate=p, + object=o, + description=content, + embedding_key=embedding_pair[0], + poignancy=poignancy, + keywords=keywords, + filling=filling, + ) + + keywords = [i.lower() for i in keywords] + for kw in keywords: + if kw in self.event_keywords: + self.event_keywords[kw][0:0] = [memory_node] + else: + self.event_keywords[kw] = [memory_node] + + self.add(memory_node) + + if f"{p} {o}" != "is idle": + for kw in keywords: + if kw in self.kw_strength_event: + self.kw_strength_event[kw] += 1 + else: + self.kw_strength_event[kw] = 1 + + self.embeddings[embedding_pair[0]] = embedding_pair[1] + return memory_node + + def get_summarized_latest_events(self, retention): + ret_set = set() + for e_node in self.event_list[:retention]: + ret_set.add(e_node.summary()) + return ret_set + + def get_last_chat(self, target_role_name: str): + if target_role_name.lower() in self.chat_keywords: + return self.chat_keywords[target_role_name.lower()][0] + else: + return False + + def retrieve_relevant_thoughts(self, s_content: str, p_content: str, o_content: str) -> set: + contents = [s_content, p_content, o_content] + + ret = [] + for i in contents: + if i.lower() in self.thought_keywords: + ret += 
self.thought_keywords[i.lower()] + + ret = set(ret) + return ret + + def retrieve_relevant_events(self, s_content: str, p_content: str, o_content: str) -> set: + contents = [s_content, p_content, o_content] + + ret = [] + for i in contents: + if i in self.event_keywords: + ret += self.event_keywords[i] + + ret = set(ret) + return ret diff --git a/metagpt/ext/stanford_town/memory/retrieve.py b/metagpt/ext/stanford_town/memory/retrieve.py new file mode 100644 index 000000000..c4b32f965 --- /dev/null +++ b/metagpt/ext/stanford_town/memory/retrieve.py @@ -0,0 +1,180 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : Retrieve函数实现 + +import datetime + +from numpy import dot +from numpy.linalg import norm + +from metagpt.ext.stanford_town.memory.agent_memory import BasicMemory +from metagpt.ext.stanford_town.utils.utils import get_embedding + + +def agent_retrieve( + agent_memory, + curr_time: datetime.datetime, + memory_forget: float, + query: str, + nodes: list[BasicMemory], + topk: int = 4, +) -> list[BasicMemory]: + """ + Retrieve需要集合Role使用,原因在于Role才具有AgentMemory,scratch + 逻辑:Role调用该函数,self.rc.AgentMemory,self.rc.scratch.curr_time,self.rc.scratch.memory_forget + 输入希望查询的内容与希望回顾的条数,返回TopK条高分记忆,即List[BasicMemory] + + Score_lists示例 + { + "memory": memories[i], BasicMemory类 + "importance": memories[i].poignancy + "recency": 衰减因子计算结果 + "relevance": 搜索结果 + } + """ + memories = nodes + agent_memory_embedding = agent_memory.embeddings + memories = sorted(memories, key=lambda memory_node: memory_node.last_accessed, reverse=True) + + score_list = [] + score_list = extract_importance(memories, score_list) + score_list = extract_recency(curr_time, memory_forget, score_list) + score_list = extract_relevance(agent_memory_embedding, query, score_list) + score_list = normalize_score_floats(score_list, 0, 1) + + total_dict = {} + gw = [1, 1, 1] # 三个因素的权重,重要性,近因性,相关性, + for i in range(len(score_list)): + total_score = ( + score_list[i]["importance"] * gw[0] + 
score_list[i]["recency"] * gw[1] + score_list[i]["relevance"] * gw[2]
+        )
+        total_dict[score_list[i]["memory"].memory_id] = total_score
+
+    result = top_highest_x_values(total_dict, topk)
+
+    return result  # a list of the memory ids of the top-scoring BasicMemory nodes
+
+
+def new_agent_retrieve(role, focus_points: list, n_count=30) -> dict:
+    """
+    Input: a role, a list of focus points and the number of memories to retrieve.
+    Output: a dict whose keys are the focus points and whose values are the retrieved memory lists.
+    """
+    retrieved = dict()
+    for focal_pt in focus_points:
+        nodes = [
+            [i.last_accessed, i]
+            for i in role.memory.event_list + role.memory.thought_list
+            if "idle" not in i.embedding_key
+        ]
+        nodes = sorted(nodes, key=lambda x: x[0])
+        nodes = [i for created, i in nodes]
+        results = agent_retrieve(
+            role.memory, role.scratch.curr_time, role.scratch.recency_decay, focal_pt, nodes, n_count
+        )
+        final_result = []
+        for n in results:
+            for i in role.memory.storage:
+                if i.memory_id == n:
+                    i.last_accessed = role.scratch.curr_time
+                    final_result.append(i)
+
+        retrieved[focal_pt] = final_result
+
+    return retrieved
+
+
+def top_highest_x_values(d, x):
+    """
+    Given a dict and a count x, return the keys of the top-x entries ranked by value.
+    """
+    top_v = [item[0] for item in sorted(d.items(), key=lambda item: item[1], reverse=True)[:x]]
+    return top_v
+
+
+def extract_importance(memories, score_list):
+    """
+    Extract the importance score.
+    """
+    for i in range(len(memories)):
+        score = {"memory": memories[i], "importance": memories[i].poignancy}
+        score_list.append(score)
+    return score_list
+
+
+def extract_relevance(agent_memory_embedding, query, score_list):
+    """
+    Extract the relevance score.
+    """
+    query_embedding = get_embedding(query)
+    for i in range(len(score_list)):
+        node_embedding = agent_memory_embedding[score_list[i]["memory"].embedding_key]
+        result = cos_sim(node_embedding, query_embedding)
+        score_list[i]["relevance"] = result
+
+    return score_list
+
+
+def extract_recency(curr_time, memory_forget, score_list):
+    """
+    Extract the recency score; currently one decay-factor step is applied per elapsed real-world day.
+    """
+    for i in range(len(score_list)):
+        day_count = (curr_time - score_list[i]["memory"].created).days
+        score_list[i]["recency"] = memory_forget**day_count
+    return score_list
+
+
+def cos_sim(a, b):
+    """
+    Compute cosine similarity.
+    """
+    return dot(a, b) / (norm(a) * norm(b))
+
+
+def normalize_list_floats(single_list, target_min, target_max):
+    """
+    Normalize a single list.
+    """
+    if len(single_list) == 0:
+        return []
+
+    min_val = min(single_list)
+    max_val = max(single_list)
+    range_val = max_val - min_val
+
+    if range_val == 0:
+        for i in range(len(single_list)):
+            single_list[i] = (target_max - target_min) / 2
+    else:
+        for i in range(len(single_list)):
+            single_list[i] = (single_list[i] - min_val) * (target_max - target_min) / range_val + target_min
+    return single_list
+
+
+def normalize_score_floats(score_list, target_min, target_max):
+    """
+    Normalize the importance, relevance and recency scores together.
+    """
+    importance_list = []
+    relevance_list = []
+    recency_list = []
+
+    for i in range(len(score_list)):
+        importance_list.append(score_list[i]["importance"])
+        relevance_list.append(score_list[i]["relevance"])
+        recency_list.append(score_list[i]["recency"])
+
+    # normalize each component list
+    importance_list = normalize_list_floats(importance_list, target_min, target_max)
+    relevance_list = normalize_list_floats(relevance_list, target_min, target_max)
+    recency_list = normalize_list_floats(recency_list, target_min, target_max)
+
+    for i in range(len(score_list)):
+        score_list[i]["importance"] = importance_list[i]
+        score_list[i]["relevance"] = relevance_list[i]
+        score_list[i]["recency"] = recency_list[i]
+
+    return score_list
diff --git a/metagpt/ext/stanford_town/memory/scratch.py b/metagpt/ext/stanford_town/memory/scratch.py
new file mode 100644
index 000000000..b4036f839
--- /dev/null
+++ b/metagpt/ext/stanford_town/memory/scratch.py
@@ -0,0 +1,383 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+# @Desc   : implementation of the Scratch class (role-information class)
+
+from datetime import datetime, timedelta
+from pathlib import Path
+from typing import Optional, Union
+
+from pydantic import BaseModel, Field, field_serializer, field_validator
+
+from metagpt.utils.common import
read_json_file, write_json_file
+
+
+class Scratch(BaseModel):
+    # Category 1: persona hyperparameters
+    vision_r: int = 4
+    att_bandwidth: int = 3
+    retention: int = 5
+
+    # Category 2: world information
+    curr_time: Optional[datetime] = Field(default=None)
+    curr_tile: Optional[list[int]] = Field(default=None)
+    daily_plan_req: Optional[str] = Field(default=None)
+
+    # Category 3: the persona's core identity
+    name: Optional[str] = Field(default=None)
+    first_name: Optional[str] = Field(default=None)
+    last_name: Optional[str] = Field(default=None)
+    age: Optional[int] = Field(default=None)
+    innate: Optional[str] = Field(default=None)  # L0 permanent core traits.
+    learned: Optional[str] = Field(default=None)  # L1 stable traits.
+    currently: Optional[str] = Field(default=None)  # L2 external implementation.
+    lifestyle: Optional[str] = Field(default=None)
+    living_area: Optional[str] = Field(default=None)
+
+    # Category 4: old reflection variables
+    concept_forget: int = 100
+    daily_reflection_time: int = 60 * 3
+    daily_reflection_size: int = 5
+    overlap_reflect_th: int = 2
+    kw_strg_event_reflect_th: int = 4
+    kw_strg_thought_reflect_th: int = 4
+
+    # Category 5: new reflection variables
+    recency_w: int = 1
+    relevance_w: int = 1
+    importance_w: int = 1
+    recency_decay: float = 0.99
+    importance_trigger_max: int = 150
+    importance_trigger_curr: int = 150
+    importance_ele_n: int = 0
+    thought_count: int = 5
+
+    # Category 6: personal plans
+    daily_req: list[str] = Field(default=[])
+    f_daily_schedule: list[list[Union[int, str]]] = Field(default=[])
+    f_daily_schedule_hourly_org: list[list[Union[int, str]]] = Field(default=[])
+
+    # Category 7: current action
+    act_address: Optional[str] = Field(default=None)
+    act_start_time: Optional[datetime] = Field(default=None)
+    act_duration: Optional[int] = Field(default=None)
+    act_description: Optional[str] = Field(default=None)
+    act_pronunciatio: Optional[str] = Field(default=None)
+    act_event: list[Optional[str]] = [None, None, None]
+
+    act_obj_description: Optional[str] = Field(default=None)
+    act_obj_pronunciatio: Optional[str] = Field(default=None)
+    act_obj_event:
list[Optional[str]] = [None, None, None]
+
+    chatting_with: Optional[str] = Field(default=None)
+    chat: Optional[str] = Field(default=None)
+    chatting_with_buffer: dict = dict()
+    chatting_end_time: Optional[datetime] = Field(default=None)
+
+    act_path_set: bool = False
+    planned_path: list[list[int]] = Field(default=[])
+
+    @field_validator("curr_time", "act_start_time", "chatting_end_time", mode="before")
+    @classmethod
+    def check_time_field(cls, time_field):
+        val = datetime.strptime(time_field, "%B %d, %Y, %H:%M:%S") if time_field else None
+        return val
+
+    @field_serializer("curr_time", "act_start_time", "chatting_end_time")
+    def transform_time_field(self, time_field: Optional[datetime]) -> str:
+        if time_field:
+            time_field = time_field.strftime("%B %d, %Y, %H:%M:%S")
+        return time_field
+
+    @classmethod
+    def init_scratch_from_path(cls, f_saved: Path):
+        scratch_load = read_json_file(f_saved)
+        scratch = Scratch(**scratch_load)
+        return scratch
+
+    def save(self, out_json: Path):
+        """
+        Save persona's scratch.
+
+        INPUT:
+          out_json: The file where we will be saving our persona's state.
+        OUTPUT:
+          None
+        """
+        scratch = self.model_dump()
+        write_json_file(out_json, scratch, encoding="utf-8")
+
+    def get_f_daily_schedule_index(self, advance=0):
+        """
+        We get the current index of self.f_daily_schedule.
+
+        Recall that self.f_daily_schedule stores the decomposed action sequences
+        up until now, and the hourly sequences of the future action for the rest
+        of today. Given that self.f_daily_schedule is a list of list where the
+        inner list is composed of [task, duration], we continue to add up the
+        duration until we reach "if elapsed > today_min_elapsed" condition. The
+        index where we stop is the index we will return.
+
+        INPUT
+          advance: Integer value of the number of minutes we want to look into
+                   the future. This allows us to get the index of a future timeframe.
+        OUTPUT
+          an integer value for the current index of f_daily_schedule.
+        """
+        # We first calculate the number of minutes elapsed today.
+        today_min_elapsed = 0
+        today_min_elapsed += self.curr_time.hour * 60
+        today_min_elapsed += self.curr_time.minute
+        today_min_elapsed += advance
+
+        # We then calculate the current index based on that.
+        curr_index = 0
+        elapsed = 0
+        for task, duration in self.f_daily_schedule:
+            elapsed += duration
+            if elapsed > today_min_elapsed:
+                return curr_index
+            curr_index += 1
+
+        return curr_index
+
+    def get_f_daily_schedule_hourly_org_index(self, advance=0):
+        """
+        We get the current index of self.f_daily_schedule_hourly_org.
+        It is otherwise the same as get_f_daily_schedule_index.
+
+        INPUT
+          advance: Integer value of the number of minutes we want to look into
+                   the future. This allows us to get the index of a future timeframe.
+        OUTPUT
+          an integer value for the current index of f_daily_schedule_hourly_org.
+        """
+        # We first calculate the number of minutes elapsed today.
+        today_min_elapsed = 0
+        today_min_elapsed += self.curr_time.hour * 60
+        today_min_elapsed += self.curr_time.minute
+        today_min_elapsed += advance
+        # We then calculate the current index based on that.
+        curr_index = 0
+        elapsed = 0
+        for task, duration in self.f_daily_schedule_hourly_org:
+            elapsed += duration
+            if elapsed > today_min_elapsed:
+                return curr_index
+            curr_index += 1
+        return curr_index
+
+    def get_str_iss(self):
+        """
+        ISS stands for "identity stable set." This describes the commonset summary
+        of this persona -- basically, the bare minimum description of the persona
+        that gets used in almost all prompts that need to call on the persona.
+
+        INPUT
+          None
+        OUTPUT
+          the identity stable set summary of the persona in a string form.
+ EXAMPLE STR OUTPUT + "Name: Dolores Heitmiller + Age: 28 + Innate traits: hard-edged, independent, loyal + Learned traits: Dolores is a painter who wants live quietly and paint + while enjoying her everyday life. + Currently: Dolores is preparing for her first solo show. She mostly + works from home. + Lifestyle: Dolores goes to bed around 11pm, sleeps for 7 hours, eats + dinner around 6pm. + Daily plan requirement: Dolores is planning to stay at home all day and + never go out." + """ + commonset = "" + commonset += f"Name: {self.name}\n" + commonset += f"Age: {self.age}\n" + commonset += f"Innate traits: {self.innate}\n" + commonset += f"Learned traits: {self.learned}\n" + commonset += f"Currently: {self.currently}\n" + commonset += f"Lifestyle: {self.lifestyle}\n" + commonset += f"Daily plan requirement: {self.daily_plan_req}\n" + commonset += f"Current Date: {self.curr_time.strftime('%A %B %d') if self.curr_time else ''}\n" + return commonset + + def get_str_name(self): + return self.name + + def get_str_firstname(self): + return self.first_name + + def get_str_lastname(self): + return self.last_name + + def get_str_age(self): + return str(self.age) + + def get_str_innate(self): + return self.innate + + def get_str_learned(self): + return self.learned + + def get_str_currently(self): + return self.currently + + def get_str_lifestyle(self): + return self.lifestyle + + def get_str_daily_plan_req(self): + return self.daily_plan_req + + def get_str_curr_date_str(self): + return self.curr_time.strftime("%A %B %d") + + def get_curr_event(self): + if not self.act_address: + return self.name, None, None + else: + return self.act_event + + def get_curr_event_and_desc(self): + if not self.act_address: + return self.name, None, None, None + else: + return self.act_event[0], self.act_event[1], self.act_event[2], self.act_description + + def get_curr_obj_event_and_desc(self): + if not self.act_address: + return "", None, None, None + else: + return self.act_address, 
self.act_obj_event[1], self.act_obj_event[2], self.act_obj_description + + def add_new_action( + self, + action_address, + action_duration, + action_description, + action_pronunciatio, + action_event, + chatting_with, + chat, + chatting_with_buffer, + chatting_end_time, + act_obj_description, + act_obj_pronunciatio, + act_obj_event, + act_start_time=None, + ): + self.act_address = action_address + self.act_duration = action_duration + self.act_description = action_description + self.act_pronunciatio = action_pronunciatio + self.act_event = action_event + + self.chatting_with = chatting_with + self.chat = chat + if chatting_with_buffer: + self.chatting_with_buffer.update(chatting_with_buffer) + self.chatting_end_time = chatting_end_time + + self.act_obj_description = act_obj_description + self.act_obj_pronunciatio = act_obj_pronunciatio + self.act_obj_event = act_obj_event + + self.act_start_time = self.curr_time + + self.act_path_set = False + + def act_time_str(self): + """ + Returns a string output of the current time. + + INPUT + None + OUTPUT + A string output of the current time. + EXAMPLE STR OUTPUT + "14:05 P.M." + """ + return self.act_start_time.strftime("%H:%M %p") + + def act_check_finished(self): + """ + Checks whether the self.Action instance has finished. + + INPUT + curr_datetime: Current time. If current time is later than the action's + start time + its duration, then the action has finished. + OUTPUT + Boolean [True]: Action has finished. + Boolean [False]: Action has not finished and is still ongoing. 
+ """ + if not self.act_address: + return True + + if self.chatting_with: + end_time = self.chatting_end_time + else: + x = self.act_start_time + if x.second != 0: + x = x.replace(second=0) + x = x + timedelta(minutes=1) + end_time = x + timedelta(minutes=self.act_duration) + + if end_time.strftime("%H:%M:%S") == self.curr_time.strftime("%H:%M:%S"): + return True + return False + + def act_summarize(self): + """ + Summarize the current action as a dictionary. + + INPUT + None + OUTPUT + ret: A human readable summary of the action. + """ + exp = dict() + exp["persona"] = self.name + exp["address"] = self.act_address + exp["start_datetime"] = self.act_start_time + exp["duration"] = self.act_duration + exp["description"] = self.act_description + exp["pronunciatio"] = self.act_pronunciatio + return exp + + def act_summary_str(self): + """ + Returns a string summary of the current action. Meant to be + human-readable. + + INPUT + None + OUTPUT + ret: A human readable summary of the action. + """ + start_datetime_str = self.act_start_time.strftime("%A %B %d -- %H:%M %p") + ret = f"[{start_datetime_str}]\n" + ret += f"Activity: {self.name} is {self.act_description}\n" + ret += f"Address: {self.act_address}\n" + ret += f"Duration in minutes (e.g., x min): {str(self.act_duration)} min\n" + return ret + + def get_daily_schedule(self, daily_schedule: list[list[str]]): + ret = "" + curr_min_sum = 0 + for row in daily_schedule: + curr_min_sum += row[1] + hour = int(curr_min_sum / 60) + minute = curr_min_sum % 60 + ret += f"{hour:02}:{minute:02} || {row[0]}\n" + return ret + + def get_str_daily_schedule_summary(self): + return self.get_daily_schedule(self.f_daily_schedule) + + def get_str_daily_schedule_hourly_org_summary(self): + return self.get_daily_schedule(self.f_daily_schedule_hourly_org) diff --git a/metagpt/ext/stanford_town/memory/spatial_memory.py b/metagpt/ext/stanford_town/memory/spatial_memory.py new file mode 100644 index 000000000..71b856907 --- /dev/null +++ 
b/metagpt/ext/stanford_town/memory/spatial_memory.py
@@ -0,0 +1,116 @@
+"""
+Author: Joon Sung Park (joonspk@stanford.edu)
+
+File: spatial_memory.py
+Description: Defines the MemoryTree class that serves as the agents' spatial
+memory that aids in grounding their behavior in the game world.
+"""
+from pathlib import Path
+
+from pydantic import BaseModel, Field
+
+from metagpt.logs import logger
+from metagpt.utils.common import read_json_file, write_json_file
+
+
+class MemoryTree(BaseModel):
+    tree: dict = Field(default_factory=dict)
+
+    def set_mem_path(self, f_saved: Path):
+        self.tree = read_json_file(f_saved)
+
+    def print_tree(self) -> None:
+        def _print_tree(tree, depth):
+            dash = " >" * depth
+            if isinstance(tree, list):
+                if tree:
+                    logger.info(f"{dash} {tree}")
+                return
+
+            for key, val in tree.items():
+                if key:
+                    logger.info(f"{dash} {key}")
+                _print_tree(val, depth + 1)
+
+        _print_tree(self.tree, 0)
+
+    def save(self, out_json: Path) -> None:
+        write_json_file(out_json, self.tree)
+
+    def get_str_accessible_sectors(self, curr_world: str) -> str:
+        """
+        Returns a summary string of all the sectors that the persona can access
+        within the current world.
+
+        Note that there are places a given persona cannot enter. This information
+        is provided in the persona sheet. We account for this in this function.
+
+        INPUT
+          None
+        OUTPUT
+          A summary string of all the sectors that the persona can access.
+        EXAMPLE STR OUTPUT
+          "bedroom, kitchen, dining room, office, bathroom"
+        """
+        x = ", ".join(list(self.tree[curr_world].keys()))
+        return x
+
+    def get_str_accessible_sector_arenas(self, sector: str) -> str:
+        """
+        Returns a summary string of all the arenas that the persona can access
+        within the current sector.
+
+        Note that there are places a given persona cannot enter. This information
+        is provided in the persona sheet. We account for this in this function.
+
+        INPUT
+          None
+        OUTPUT
+          A summary string of all the arenas that the persona can access.
+        EXAMPLE STR OUTPUT
+          "bedroom, kitchen, dining room, office, bathroom"
+        """
+        curr_world, curr_sector = sector.split(":")
+        if not curr_sector:
+            return ""
+        x = ", ".join(list(self.tree[curr_world][curr_sector].keys()))
+        return x
+
+    def get_str_accessible_arena_game_objects(self, arena: str) -> str:
+        """
+        Get a str list of all accessible game objects that are in the arena. If
+        an arena address is specified, we return the objects that are available
+        in that arena, and if not, we return the objects that are in the arena
+        our persona is currently in.
+
+        INPUT
+          arena: optional arena address
+        OUTPUT
+          str list of all accessible game objects in the game arena.
+        EXAMPLE STR OUTPUT
+          "phone, charger, bed, nightstand"
+        """
+        curr_world, curr_sector, curr_arena = arena.split(":")
+
+        if not curr_arena:
+            return ""
+
+        try:
+            x = ", ".join(list(self.tree[curr_world][curr_sector][curr_arena]))
+        except Exception:
+            x = ", ".join(list(self.tree[curr_world][curr_sector][curr_arena.lower()]))
+        return x
+
+    def add_tile_info(self, tile_info: dict) -> None:
+        if tile_info["world"]:
+            if tile_info["world"] not in self.tree:
+                self.tree[tile_info["world"]] = {}
+        if tile_info["sector"]:
+            if tile_info["sector"] not in self.tree[tile_info["world"]]:
+                self.tree[tile_info["world"]][tile_info["sector"]] = {}
+        if tile_info["arena"]:
+            if tile_info["arena"] not in self.tree[tile_info["world"]][tile_info["sector"]]:
+                self.tree[tile_info["world"]][tile_info["sector"]][tile_info["arena"]] = []
+        if tile_info["game_object"]:
+            if tile_info["game_object"] not in self.tree[tile_info["world"]][tile_info["sector"]][tile_info["arena"]]:
+                self.tree[tile_info["world"]][tile_info["sector"]][tile_info["arena"]] += [tile_info["game_object"]]
diff --git a/metagpt/ext/stanford_town/plan/__init__.py b/metagpt/ext/stanford_town/plan/__init__.py
new file mode 100644
index 000000000..2bcf8efd0
--- /dev/null
+++ b/metagpt/ext/stanford_town/plan/__init__.py
@@ -0,0 +1,3 @@
+#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : diff --git a/metagpt/ext/stanford_town/plan/converse.py b/metagpt/ext/stanford_town/plan/converse.py new file mode 100644 index 000000000..8eefbc9b4 --- /dev/null +++ b/metagpt/ext/stanford_town/plan/converse.py @@ -0,0 +1,93 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : conversation between two agents + +from typing import Tuple + +from metagpt.ext.stanford_town.actions.agent_chat_sum_rel import AgentChatSumRel +from metagpt.ext.stanford_town.actions.gen_iter_chat_utt import GenIterChatUTT +from metagpt.ext.stanford_town.memory.retrieve import new_agent_retrieve +from metagpt.logs import logger + + +async def agent_conversation(init_role: "STRole", target_role: "STRole", conv_rounds: int = 8) -> list[list[str]]: + curr_chat = [] + logger.info(f"Role: {init_role.name} starts a conversation with Role: {target_role.name}") + + for idx in range(conv_rounds): + logger.info(f"Conv round: {idx} between {init_role.name} and {target_role.name}") + scratch = init_role.rc.scratch + target_scratch = target_role.rc.scratch + + focal_points = [f"{target_scratch.name}"] + retrieved = new_agent_retrieve(init_role, focal_points, 50) + relationship = await generate_summarize_agent_relationship(init_role, target_role, retrieved) + logger.info(f"The relationship between {init_role.name} and {target_role.name}: {relationship}") + last_chat = "" + for i in curr_chat[-4:]: + last_chat += ": ".join(i) + "\n" + if last_chat: + focal_points = [f"{relationship}", f"{target_scratch.name} is {target_scratch.act_description}", last_chat] + else: + focal_points = [f"{relationship}", f"{target_scratch.name} is {target_scratch.act_description}"] + retrieved = new_agent_retrieve(init_role, focal_points, 15) + utt, end = await generate_one_utterance(init_role, target_role, retrieved, curr_chat) + + curr_chat += [[scratch.name, utt]] + if end: + break + + focal_points = [f"{scratch.name}"] + retrieved = 
new_agent_retrieve(target_role, focal_points, 50) + relationship = await generate_summarize_agent_relationship(target_role, init_role, retrieved) + logger.info(f"The relationship between {target_role.name} and {init_role.name}: {relationship}") + last_chat = "" + for i in curr_chat[-4:]: + last_chat += ": ".join(i) + "\n" + if last_chat: + focal_points = [f"{relationship}", f"{scratch.name} is {scratch.act_description}", last_chat] + else: + focal_points = [f"{relationship}", f"{scratch.name} is {scratch.act_description}"] + retrieved = new_agent_retrieve(target_role, focal_points, 15) + utt, end = await generate_one_utterance(target_role, init_role, retrieved, curr_chat) + + curr_chat += [[target_scratch.name, utt]] + if end: + break + + logger.warning(f"Conversations between {target_role.name} and {init_role.name}:") + for row in curr_chat: + logger.info(row) + + return curr_chat + + +async def generate_summarize_agent_relationship(init_role: "STRole", target_role: "STRole", retrieved: dict) -> str: + all_embedding_keys = list() + for key, val in retrieved.items(): + for i in val: + all_embedding_keys += [i.embedding_key] + all_embedding_key_str = "" + for i in all_embedding_keys: + all_embedding_key_str += f"{i}\n" + + summarized_relationship = await AgentChatSumRel().run(init_role, target_role, all_embedding_key_str) + return summarized_relationship + + +async def generate_one_utterance(init_role, target_role, retrieved: dict, curr_chat: list) -> Tuple[str, str]: + # Chat version optimized for speed via batch generation + scratch = init_role.rc.scratch + target_scratch = target_role.rc.scratch + curr_context = ( + f"{scratch.name} " + + f"was {scratch.act_description} " + + f"when {scratch.name} " + + f"saw {target_scratch.name} " + + f"in the middle of {target_scratch.act_description}.\n" + ) + curr_context += f"{scratch.name} " + "is initiating a conversation with " + f"{target_scratch.name}." 
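For illustration, here is a standalone sketch of how the `curr_context` string above renders; the names and activities are made up, and only the f-string pattern comes from the code:

```python
# Hypothetical stand-ins for the scratch.name / act_description fields.
name, act = "Klaus", "reading a research paper"
target_name, target_act = "Maria", "making coffee"

# Same assembly pattern as in generate_one_utterance above.
curr_context = (
    f"{name} " + f"was {act} " + f"when {name} " + f"saw {target_name} " + f"in the middle of {target_act}.\n"
)
curr_context += f"{name} " + "is initiating a conversation with " + f"{target_name}."
print(curr_context)
```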
+ + x = await GenIterChatUTT().run(init_role, target_role, retrieved, curr_context, curr_chat) + + return x["utterance"], x["end"] diff --git a/metagpt/ext/stanford_town/plan/st_plan.py b/metagpt/ext/stanford_town/plan/st_plan.py new file mode 100644 index 000000000..f63052fc5 --- /dev/null +++ b/metagpt/ext/stanford_town/plan/st_plan.py @@ -0,0 +1,706 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# @Desc : st' planning execution + +import datetime +import math +import random +from typing import Tuple, Union + +from metagpt.ext.stanford_town.actions.decide_to_talk import DecideToTalk +from metagpt.ext.stanford_town.actions.gen_action_details import GenActionDetails +from metagpt.ext.stanford_town.actions.gen_daily_schedule import GenDailySchedule +from metagpt.ext.stanford_town.actions.gen_hourly_schedule import GenHourlySchedule +from metagpt.ext.stanford_town.actions.new_decomp_schedule import NewDecompSchedule +from metagpt.ext.stanford_town.actions.summarize_conv import SummarizeConv +from metagpt.ext.stanford_town.actions.task_decomp import TaskDecomp +from metagpt.ext.stanford_town.actions.wake_up import WakeUp +from metagpt.ext.stanford_town.memory.retrieve import new_agent_retrieve +from metagpt.ext.stanford_town.plan.converse import agent_conversation +from metagpt.ext.stanford_town.utils.utils import get_embedding +from metagpt.llm import LLM +from metagpt.logs import logger + + +async def plan(role: "STRole", roles: dict["STRole"], new_day: bool, retrieved: dict) -> str: + # PART 1: Generate the hourly schedule. + if new_day: + await _long_term_planning(role, new_day) + + # PART 2: If the current action has expired, we want to create a new plan. 
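A rough standalone sketch of that expiry test (simplified: the real `act_check_finished` in `Scratch` additionally handles ongoing chats and rounds seconds up to the next minute; the function name here is illustrative):

```python
import datetime


def act_expired(act_start: datetime.datetime, act_duration_min: int,
                curr_time: datetime.datetime) -> bool:
    # An action runs from its start time for act_duration_min minutes;
    # once the current time reaches the end time, a new plan is needed.
    end_time = act_start + datetime.timedelta(minutes=act_duration_min)
    return curr_time >= end_time


start = datetime.datetime(2023, 2, 13, 9, 0)
print(act_expired(start, 30, datetime.datetime(2023, 2, 13, 9, 15)))  # False
print(act_expired(start, 30, datetime.datetime(2023, 2, 13, 9, 30)))  # True
```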
act_check_finished = role.scratch.act_check_finished()
+    logger.info(f"Role: {role.name} act_check_finished is {act_check_finished}")
+    if act_check_finished:
+        await _determine_action(role)
+
+    # PART 3: If you perceived an event that needs to be responded to (saw
+    # another role), and retrieved relevant information.
+    # Step 1: Retrieved may have multiple events represented in it. The first
+    #         job here is to determine which of the events we want to focus
+    #         on for the role.
+    #         <retrieved> takes the form of a dictionary like this:
+    #         dictionary {["curr_event"] = <ConceptNode>,
+    #                     ["events"] = [<ConceptNode>, ...],
+    #                     ["thoughts"] = [<ConceptNode>, ...]}
+    focused_event = False
+    if retrieved.keys():
+        focused_event = _choose_retrieved(role.name, retrieved)
+
+    # Step 2: Once we choose an event, we need to determine whether the
+    #         role will take any actions for the perceived event. There are
+    #         three possible modes of reaction returned by _should_react.
+    #         a) "chat with {target_role.name}"
+    #         b) "react"
+    #         c) False
+    logger.info(f"Role: {role.name} focused_event: {focused_event}")
+    if focused_event:
+        reaction_mode = await _should_react(role, focused_event, roles)
+        logger.info(f"Role: {role.name} reaction_mode: {reaction_mode}")
+        if reaction_mode:
+            # If we do want to chat, then we generate conversation
+            if reaction_mode[:9] == "chat with":
+                await _chat_react(role, reaction_mode, roles)
+            elif reaction_mode[:4] == "wait":
+                await _wait_react(role, reaction_mode)
+
+    # Step 3: Chat-related state clean up.
+    # If the persona is not chatting with anyone, we clean up any of the
+    # chat-related states here.
+    if role.rc.scratch.act_event[1] != "chat with":
+        role.rc.scratch.chatting_with = None
+        role.rc.scratch.chat = None
+        role.rc.scratch.chatting_end_time = None
+    # We want to make sure that the persona does not keep conversing with each
+    # other in an infinite loop. So, chatting_with_buffer maintains a form of
+    # buffer that makes the persona wait from talking to the same target
+    # immediately after chatting once. We keep track of the buffer value here.
+    curr_persona_chat_buffer = role.rc.scratch.chatting_with_buffer
+    for persona_name, buffer_count in curr_persona_chat_buffer.items():
+        if persona_name != role.rc.scratch.chatting_with:
+            role.rc.scratch.chatting_with_buffer[persona_name] -= 1
+
+    return role.rc.scratch.act_address
+
+
+def _choose_retrieved(role_name: str, retrieved: dict) -> Union[None, dict]:
+    """
+    Retrieved elements have multiple core "curr_events". We need to choose one
+    event to which we are going to react to. We pick that event here.
+    Args:
+        role_name: Current role instance's name whose action we are determining.
+        retrieved: A dictionary of <ConceptNode>s that were retrieved from the
+                   role's associative memory. This dictionary takes the
+                   following form:
+                   dictionary[event.description] =
+                       {["curr_event"] = <ConceptNode>,
+                        ["events"] = [<ConceptNode>, ...],
+                        ["thoughts"] = [<ConceptNode>, ...]}
+    """
+    # Once we are done with the reflection, we might want to build a more
+    # complex structure here.
+
+    # We do not want to take self events... for now
+    copy_retrieved = retrieved.copy()
+    for event_desc, rel_ctx in copy_retrieved.items():
+        curr_event = rel_ctx["curr_event"]
+        if curr_event.subject == role_name:
+            del retrieved[event_desc]
+
+    # Always choose role first.
+    priority = []
+    for event_desc, rel_ctx in retrieved.items():
+        curr_event = rel_ctx["curr_event"]
+        if ":" not in curr_event.subject and curr_event.subject != role_name:
+            priority += [rel_ctx]
+    if priority:
+        return random.choice(priority)
+
+    # Skip idle.
+    for event_desc, rel_ctx in retrieved.items():
+        if "is idle" not in event_desc:
+            priority += [rel_ctx]
+    if priority:
+        return random.choice(priority)
+    return None
+
+
+async def _should_react(role: "STRole", retrieved: dict, roles: dict):
+    """
+    Determines what form of reaction the role should exhibit given the
+    retrieved values.
+    INPUT
+      role: Current <"STRole"> instance whose action we are determining.
+      retrieved: A dictionary of <ConceptNode>s that were retrieved from the
+                 role's associative memory. This dictionary takes the
+                 following form:
+                 dictionary[event.description] =
+                     {["curr_event"] = <ConceptNode>,
+                      ["events"] = [<ConceptNode>, ...],
+                      ["thoughts"] = [<ConceptNode>, ...]}
+      roles: A dictionary that contains all role names as keys, and the
+             <"STRole"> instance as values.
+    """
+
+    async def lets_talk(init_role: "STRole", target_role: "STRole", retrieved: dict):
+        if init_role.name == target_role.name:
+            logger.info(f"Role: {role.name} _should_react lets_talk meet same role, return False")
+            return False
+
+        scratch = init_role.rc.scratch
+        target_scratch = target_role.rc.scratch
+        if (
+            not target_scratch.act_address
+            or not target_scratch.act_description
+            or not scratch.act_address
+            or not scratch.act_description
+        ):
+            return False
+
+        if "sleeping" in target_scratch.act_description or "sleeping" in scratch.act_description:
+            return False
+
+        if scratch.curr_time.hour == 23:
+            return False
+
+        if "<waiting>" in target_scratch.act_address:
+            return False
+
+        if target_scratch.chatting_with or scratch.chatting_with:
+            return False
+
+        if target_role.name in scratch.chatting_with_buffer:
+            if scratch.chatting_with_buffer[target_role.name] > 0:
+                return False
+
+        if await DecideToTalk().run(init_role, target_role, retrieved):
+            return True
+
+        return False
+
+    async def lets_react(init_role: "STRole", target_role: "STRole", retrieved: dict):
+        if init_role.name == target_role.name:
+            logger.info(f"Role: {role.name} _should_react lets_react meet same role, return False")
+            return False
+
+        scratch = init_role.rc.scratch
+        target_scratch = target_role.rc.scratch
+        if (
+            not target_scratch.act_address
+            or not target_scratch.act_description
+            or not scratch.act_address
+            or not scratch.act_description
+        ):
+            return False
+
+        if "sleeping" in target_scratch.act_description or "sleeping" in scratch.act_description:
+            return False
+
+        # return False
+        if scratch.curr_time.hour == 23:
+            return False
+
+        if "waiting" in target_scratch.act_description:
+            return False
+        if scratch.planned_path == []:
+            return False
+
+        if scratch.act_address != target_scratch.act_address:
+            return False
+
+        react_mode = await DecideToTalk().run(init_role, target_role, retrieved)
+
+        if react_mode == "1":
+            wait_until = (
+                target_scratch.act_start_time + datetime.timedelta(minutes=target_scratch.act_duration - 1)
+            ).strftime("%B %d, %Y, %H:%M:%S")
+            return f"wait: {wait_until}"
+        elif react_mode == "2":
+            return False
+        else:
+            return False  # "keep"
+
+    # If the role is chatting right now, default to no reaction
+    scratch = role.rc.scratch
+    if scratch.chatting_with:
+        return False
+    if "<waiting>" in scratch.act_address:
+        return False
+
+    # Recall that retrieved takes the following form:
+    # dictionary {["curr_event"] = <ConceptNode>}
+    curr_event = retrieved["curr_event"]
+    logger.info(f"Role: {role.name} _should_react curr_event.subject: {curr_event.subject}")
+
+    if ":" not in curr_event.subject:
+        # this is a role event.
+        if await lets_talk(role, roles[curr_event.subject], retrieved):
+            return f"chat with {curr_event.subject}"
+        react_mode = await lets_react(role, roles[curr_event.subject], retrieved)
+        return react_mode
+    return False
+
+
+async def _chat_react(role: "STRole", reaction_mode: str, roles: dict["STRole"]):
+    # There are two roles -- the role who is initiating the conversation
+    # and the role who is the target. We get the role instances here.
+    init_role = role
+    target_role = roles[reaction_mode[9:].strip()]
+
+    # Actually creating the conversation here.
+    convo, duration_min = await generate_convo(init_role, target_role)
+    convo_summary = await generate_convo_summary(convo)
+    inserted_act = convo_summary
+    inserted_act_dur = duration_min
+
+    act_start_time = target_role.rc.scratch.act_start_time
+
+    curr_time = target_role.rc.scratch.curr_time
+    if curr_time.second != 0:
+        temp_curr_time = curr_time + datetime.timedelta(seconds=60 - curr_time.second)
+        chatting_end_time = temp_curr_time + datetime.timedelta(minutes=inserted_act_dur)
+    else:
+        chatting_end_time = curr_time + datetime.timedelta(minutes=inserted_act_dur)
+
+    for role_type, p in [("init", init_role), ("target", target_role)]:
+        if role_type == "init":
+            act_address = f"<persona> {target_role.name}"
+            act_event = (p.name, "chat with", target_role.name)
+            chatting_with = target_role.name
+            chatting_with_buffer = {}
+            chatting_with_buffer[target_role.name] = 800
+        elif role_type == "target":
+            act_address = f"<persona> {init_role.name}"
+            act_event = (p.name, "chat with", init_role.name)
+            chatting_with = init_role.name
+            chatting_with_buffer = {}
+            chatting_with_buffer[init_role.name] = 800
+
+        act_pronunciatio = "💬"
+        act_obj_description = None
+        act_obj_pronunciatio = None
+        act_obj_event = (None, None, None)
+
+        await _create_react(
+            p,
+            inserted_act,
+            inserted_act_dur,
+            act_address,
+            act_event,
+            chatting_with,
+            convo,
+            chatting_with_buffer,
+            chatting_end_time,
+            act_pronunciatio,
+            act_obj_description,
+            act_obj_pronunciatio,
+            act_obj_event,
+            act_start_time,
+        )
+
+
+async def _create_react(
+    role: "STRole",
+    inserted_act: str,
+    inserted_act_dur: int,
+    act_address: str,
+    act_event: Tuple,
+    chatting_with: str,
+    chat: list,
+    chatting_with_buffer: dict,
+    chatting_end_time: datetime.datetime,
+    act_pronunciatio: str,
+    act_obj_description: str,
+    act_obj_pronunciatio: str,
+    act_obj_event: Tuple,
+    act_start_time=None,
+):
+    p = role
+    scratch = role.rc.scratch
+
+    min_sum = 0
+    for i in range(scratch.get_f_daily_schedule_hourly_org_index()):
+        min_sum += scratch.f_daily_schedule_hourly_org[i][1]
+    start_hour = int(min_sum / 60)
+
+    if scratch.f_daily_schedule_hourly_org[scratch.get_f_daily_schedule_hourly_org_index()][1] >= 120:
+        end_hour = (
+            start_hour + scratch.f_daily_schedule_hourly_org[scratch.get_f_daily_schedule_hourly_org_index()][1] / 60
+        )
+
+    elif (
+        scratch.f_daily_schedule_hourly_org[scratch.get_f_daily_schedule_hourly_org_index()][1]
+        + scratch.f_daily_schedule_hourly_org[scratch.get_f_daily_schedule_hourly_org_index() + 1][1]
+    ):
+        end_hour = start_hour + (
+            (
+                scratch.f_daily_schedule_hourly_org[scratch.get_f_daily_schedule_hourly_org_index()][1]
+                + scratch.f_daily_schedule_hourly_org[scratch.get_f_daily_schedule_hourly_org_index() + 1][1]
+            )
+            / 60
+        )
+
+    else:
+        end_hour = start_hour + 2
+    end_hour = int(end_hour)
+
+    dur_sum = 0
+    count = 0
+    start_index = None
+    end_index = None
+    for act, dur in scratch.f_daily_schedule:
+        if dur_sum >= start_hour * 60 and start_index is None:
+            start_index = count
+        if dur_sum >= end_hour * 60 and end_index is None:
+            end_index = count
+        dur_sum += dur
+        count += 1
+
+    ret = await generate_new_decomp_schedule(p, inserted_act, inserted_act_dur, start_hour, end_hour)
+    scratch.f_daily_schedule[start_index:end_index] = ret
+    scratch.add_new_action(
+        act_address,
+        inserted_act_dur,
+        inserted_act,
+        act_pronunciatio,
+        act_event,
+        chatting_with,
+        chat,
+        chatting_with_buffer,
+        chatting_end_time,
+        act_obj_description,
+        act_obj_pronunciatio,
+        act_obj_event,
+        act_start_time,
+    )
+
+
+async def _wait_react(role: "STRole", reaction_mode: str):
+    scratch = role.rc.scratch
+
+    inserted_act = f'waiting to start {scratch.act_description.split("(")[-1][:-1]}'
+    end_time = datetime.datetime.strptime(reaction_mode[6:].strip(), "%B %d, %Y, %H:%M:%S")
+    inserted_act_dur = (
+        (end_time.minute + end_time.hour * 60) - (scratch.curr_time.minute + scratch.curr_time.hour * 60) + 1
+    )
+
+    act_address = f"<waiting> {scratch.curr_tile[0]} {scratch.curr_tile[1]}"
+    act_event = (role.name, "waiting to start", scratch.act_description.split("(")[-1][:-1])
+    chatting_with = None
+    chat = None
+    chatting_with_buffer = None
+    chatting_end_time = None
+
+    act_pronunciatio = "⌛"
+    act_obj_description = None
+    act_obj_pronunciatio = None
+    act_obj_event = (None, None, None)
+
+    await _create_react(
+        role,
+        inserted_act,
+        inserted_act_dur,
+        act_address,
+        act_event,
+        chatting_with,
+        chat,
+        chatting_with_buffer,
+        chatting_end_time,
+        act_pronunciatio,
+        act_obj_description,
+        act_obj_pronunciatio,
+        act_obj_event,
+    )
+
+
+async def generate_convo(init_role: "STRole", target_role: "STRole") -> tuple[list, int]:
+    convo = await agent_conversation(init_role, target_role)
+    all_utt = ""
+
+    for row in convo:
+        speaker = row[0]
+        utt = row[1]
+        all_utt += f"{speaker}: {utt}\n"
+
+    convo_length = math.ceil(int(len(all_utt) / 8) / 30)
+
+    return convo, convo_length
+
+
+async def generate_convo_summary(conv: list[list[str]]) -> str:
+    conv_summary = await SummarizeConv().run(conv)
+    return conv_summary
+
+
+async def generate_new_decomp_schedule(
+    role: "STRole", inserted_act: str, inserted_act_dur: int, start_hour: int, end_hour: int
+):
+    # Step 1: Setting up the core variables for the function.
+    # <role> is the role whose schedule we are editing right now.
+    scratch = role.rc.scratch
+    # <today_min_pass> indicates the number of minutes that have passed today.
+    today_min_pass = int(scratch.curr_time.hour) * 60 + int(scratch.curr_time.minute) + 1
+
+    # Step 2: We need to create <main_act_dur> and <truncated_act_dur>.
+    main_act_dur = []
+    truncated_act_dur = []
+    dur_sum = 0  # duration sum
+    count = 0  # enumerate count
+    truncated_fin = False
+
+    logger.debug(f"DEBUG::: {scratch.name}")
+    for act, dur in scratch.f_daily_schedule:
+        if (dur_sum >= start_hour * 60) and (dur_sum < end_hour * 60):
+            main_act_dur += [[act, dur]]
+            if dur_sum <= today_min_pass:
+                truncated_act_dur += [[act, dur]]
+            elif dur_sum > today_min_pass and not truncated_fin:
+                # We need to insert that last act, duration list like this one:
+                # e.g., ['wakes up and completes her morning routine (wakes up...)', 2]
+                truncated_act_dur += [[scratch.f_daily_schedule[count][0], dur_sum - today_min_pass]]
+                truncated_act_dur[-1][-1] -= (
+                    dur_sum - today_min_pass
+                )  # DEC 7 DEBUG;.. is the +1 the right thing to do???
+                logger.debug(f"DEBUG::: {truncated_act_dur}")
+                truncated_fin = True
+        dur_sum += dur
+        count += 1
+
+    x = (
+        truncated_act_dur[-1][0].split("(")[0].strip()
+        + " (on the way to "
+        + truncated_act_dur[-1][0].split("(")[-1][:-1]
+        + ")"
+    )
+    truncated_act_dur[-1][0] = x
+
+    if "(" in truncated_act_dur[-1][0]:
+        inserted_act = truncated_act_dur[-1][0].split("(")[0].strip() + " (" + inserted_act + ")"
+
+    # To do inserted_act_dur+1 below is an important decision but I'm not sure
+    # if I understand the full extent of its implications. Might want to
+    # revisit.
+    truncated_act_dur += [[inserted_act, inserted_act_dur]]
+    start_time_hour = datetime.datetime(2022, 10, 31, 0, 0) + datetime.timedelta(hours=start_hour)
+    end_time_hour = datetime.datetime(2022, 10, 31, 0, 0) + datetime.timedelta(hours=end_hour)
+
+    return await NewDecompSchedule().run(
+        role, main_act_dur, truncated_act_dur, start_time_hour, end_time_hour, inserted_act, inserted_act_dur
+    )
+
+
+async def _long_term_planning(role: "STRole", new_day: bool):
+    """
+    Formulates the role's daily long-term plan if it is the start of a new
+    day. This basically has two components: first, we create the wake-up hour,
+    and second, we create the hourly schedule based on it.
+    INPUT
+        new_day: Indicates whether the current time signals a "First day",
+                 "New day", or False (for neither). This is important because we
+                 create the roles' long term planning on the new day.
+    """
+    # We start by creating the wake up hour for the role.
+    wake_up_hour = await WakeUp().run(role)
+    wake_up_hour = int(wake_up_hour)
+    logger.info(f"Role: {role.name} long_term_planning, wake_up_hour: {wake_up_hour}")
+
+    # When it is a new day, we start by creating the daily_req of the role.
+    # Note that the daily_req is a list of strings that describe the role's
+    # day in broad strokes.
+    if new_day == "First day":
+        # Bootstrapping the daily plan for the start of the generation:
+        # if this is the start of generation (so there is no previous day's
+        # daily requirement), or if we are on a new day, we want to create a new
+        # set of daily requirements.
+        role.scratch.daily_req = await GenDailySchedule().run(role, wake_up_hour)
+        logger.info(f"Role: {role.name} daily requirements: {role.scratch.daily_req}")
+    elif new_day == "New day":
+        revise_identity(role)
+
+        # - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - TODO
+        # We need to create a new daily_req here...
+        role.scratch.daily_req = role.scratch.daily_req
+
+    # Based on the daily_req, we create an hourly schedule for the role,
+    # which is a list of todo items with a time duration (in minutes) that
+    # add up to 24 hours.
+    role.scratch.f_daily_schedule = await GenHourlySchedule().run(role, wake_up_hour)
+    logger.info(f"Role: {role.name} f_daily_schedule: {role.scratch.f_daily_schedule}")
+    role.scratch.f_daily_schedule_hourly_org = role.scratch.f_daily_schedule[:]
+
+    # Added March 4 -- adding plan to the memory.
+    thought = f"This is {role.scratch.name}'s plan for {role.scratch.curr_time.strftime('%A %B %d')}:"
+    for i in role.scratch.daily_req:
+        thought += f" {i},"
+    thought = thought[:-1] + "."
+    created = role.scratch.curr_time
+    expiration = role.scratch.curr_time + datetime.timedelta(days=30)
+    s, p, o = (role.scratch.name, "plan", role.scratch.curr_time.strftime("%A %B %d"))
+    keywords = set(["plan"])
+    thought_poignancy = 5
+    thought_embedding_pair = (thought, get_embedding(thought))
+    role.a_mem.add_thought(
+        created, expiration, s, p, o, thought, keywords, thought_poignancy, thought_embedding_pair, None
+    )
+
+
+async def _determine_action(role: "STRole"):
+    """
+    Creates the next action sequence for the role.
+    The main goal of this function is to run "add_new_action" on the role's
+    scratch space, which sets up all the action related variables for the next
+    action.
+    As a part of this, the role may need to decompose its hourly schedule as
+    needed.
+    INPUT
+        role: Current <STRole> instance whose action we are determining.
+    """
+
+    def determine_decomp(act_desp, act_dura):
+        """
+        Given an action description and its duration, we determine whether we need
+        to decompose it. If the action is about the agent sleeping, we generally
+        do not want to decompose it, so that's what we catch here.
+
+        INPUT:
+            act_desp: the description of the action (e.g., "sleeping")
+            act_dura: the duration of the action in minutes.
+        OUTPUT:
+            a boolean. True if we need to decompose, False otherwise.
+        """
+        if "sleep" not in act_desp and "bed" not in act_desp:
+            return True
+        elif "sleeping" in act_desp or "asleep" in act_desp or "in bed" in act_desp:
+            return False
+        elif "sleep" in act_desp or "bed" in act_desp:
+            if act_dura > 60:
+                return False
+        return True
+
+    # The goal of this function is to get us the action associated with
+    # <curr_index>. As a part of this, we may need to decompose some large
+    # chunk actions.
+    # Importantly, we try to decompose at least two hours worth of schedule at
+    # any given point.
+    curr_index = role.scratch.get_f_daily_schedule_index()
+    curr_index_60 = role.scratch.get_f_daily_schedule_index(advance=60)
+
+    logger.info(f"f_daily_schedule: {role.scratch.f_daily_schedule}")
+    # * Decompose *
+    # During the first hour of the day, we need to decompose a two-hour
+    # sequence. We do that here.
+    if curr_index == 0:
+        # This portion is invoked if it is the first hour of the day.
+        act_desp, act_dura = role.scratch.f_daily_schedule[curr_index]
+        if act_dura >= 60:
+            # We decompose if the next action is longer than an hour, and fits the
+            # criteria described in determine_decomp.
+            if determine_decomp(act_desp, act_dura):
+                role.scratch.f_daily_schedule[curr_index : curr_index + 1] = await TaskDecomp().run(
+                    role, act_desp, act_dura
+                )
+        if curr_index_60 + 1 < len(role.scratch.f_daily_schedule):
+            act_desp, act_dura = role.scratch.f_daily_schedule[curr_index_60 + 1]
+            if act_dura >= 60:
+                if determine_decomp(act_desp, act_dura):
+                    role.scratch.f_daily_schedule[curr_index_60 + 1 : curr_index_60 + 2] = await TaskDecomp().run(
+                        role, act_desp, act_dura
+                    )
+
+    if curr_index_60 < len(role.scratch.f_daily_schedule):
+        # If it is not the first hour of the day, this is always invoked (it is
+        # also invoked during the first hour of the day -- to double up so we can
+        # decompose two hours in one go). Of course, we need to have something to
+        # decompose as well, so we check for that too.
+        if role.scratch.curr_time.hour < 23:
+            # And we don't want to decompose after 11 pm.
+            act_desp, act_dura = role.scratch.f_daily_schedule[curr_index_60]
+            if act_dura >= 60:
+                if determine_decomp(act_desp, act_dura):
+                    role.scratch.f_daily_schedule[curr_index_60 : curr_index_60 + 1] = await TaskDecomp().run(
+                        role, act_desp, act_dura
+                    )
+    # * End of Decompose *
+
+    # Generate an <Action> instance from the action description and duration. By
+    # this point, we assume that all the relevant actions are decomposed and
+    # ready in f_daily_schedule.
+    logger.debug("f_daily_schedule contents:")
+    for i in role.scratch.f_daily_schedule:
+        logger.debug(i)
+    logger.debug(curr_index)
+    logger.debug(len(role.scratch.f_daily_schedule))
+    logger.debug(role.scratch.name)
+
+    # Pad the schedule with sleep to a full day (1440 minutes).
+    x_emergency = 0
+    for i in role.scratch.f_daily_schedule:
+        x_emergency += i[1]
+
+    if 1440 - x_emergency > 0:
+        logger.info(f"Scheduled minutes before padding: {x_emergency}")
+        role.scratch.f_daily_schedule += [["sleeping", 1440 - x_emergency]]
+
+    act_desp, act_dura = role.scratch.f_daily_schedule[curr_index]
+
+    new_action_details = await GenActionDetails().run(role, act_desp, act_dura)
+    # Adding the action to role's queue.
+    role.scratch.add_new_action(**new_action_details)
+
+
+def revise_identity(role: "STRole"):
+    p_name = role.scratch.name
+
+    focal_points = [
+        f"{p_name}'s plan for {role.scratch.get_str_curr_date_str()}.",
+        f"Important recent events for {p_name}'s life.",
+    ]
+    retrieved = new_agent_retrieve(role, focal_points)
+
+    statements = "[Statements]\n"
+    for key, val in retrieved.items():
+        for i in val:
+            statements += f"{i.created.strftime('%A %B %d -- %H:%M %p')}: {i.embedding_key}\n"
+
+    plan_prompt = statements + "\n"
+    plan_prompt += f"Given the statements above, is there anything that {p_name} should remember as they plan for"
+    plan_prompt += f" *{role.scratch.curr_time.strftime('%A %B %d')}*? "
+    plan_prompt += "If there is any scheduling information, be as specific as possible (include date, time, and location if stated in the statement)\n\n"
+    plan_prompt += f"Write the response from {p_name}'s perspective."
+    plan_note = LLM().ask(plan_prompt)
+
+    thought_prompt = statements + "\n"
+    thought_prompt += (
+        f"Given the statements above, how might we summarize {p_name}'s feelings about their days up to now?\n\n"
+    )
+    thought_prompt += f"Write the response from {p_name}'s perspective."
+    thought_note = LLM().ask(thought_prompt)
+
+    currently_prompt = (
+        f"{p_name}'s status from {(role.scratch.curr_time - datetime.timedelta(days=1)).strftime('%A %B %d')}:\n"
+    )
+    currently_prompt += f"{role.scratch.currently}\n\n"
+    currently_prompt += f"{p_name}'s thoughts at the end of {(role.scratch.curr_time - datetime.timedelta(days=1)).strftime('%A %B %d')}:\n"
+    currently_prompt += (plan_note + thought_note).replace("\n", "") + "\n\n"
+    currently_prompt += f"It is now {role.scratch.curr_time.strftime('%A %B %d')}. Given the above, write {p_name}'s status for {role.scratch.curr_time.strftime('%A %B %d')} that reflects {p_name}'s thoughts at the end of {(role.scratch.curr_time - datetime.timedelta(days=1)).strftime('%A %B %d')}. Write this in third-person talking about {p_name}."
+    currently_prompt += "If there is any scheduling information, be as specific as possible (include date, time, and location if stated in the statement).\n\n"
+    currently_prompt += "Follow this format below:\nStatus: <new status>"
+    new_currently = LLM().ask(currently_prompt)
+
+    role.scratch.currently = new_currently
+
+    daily_req_prompt = role.scratch.get_str_iss() + "\n"
+    daily_req_prompt += f"Today is {role.scratch.curr_time.strftime('%A %B %d')}. Here is {role.scratch.name}'s plan today in broad-strokes (with the time of the day. e.g., have a lunch at 12:00 pm, watch TV from 7 to 8 pm).\n\n"
+    daily_req_prompt += "Follow this format (the list should have 4~6 items but no more):\n"
+    daily_req_prompt += "1. wake up and complete the morning routine at
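As a reviewer's note on the chat cooldown used in `_should_react` and `_chat_react` above: after a conversation, each participant stores a large `chatting_with_buffer` value for the other (800 in this diff), the buffer is decremented once per step for every role except the current chat partner, and a new chat with a target is only allowed once its buffer reaches zero. A minimal standalone sketch of that mechanic (helper names `decrement_chat_buffers` and `may_talk_to` are hypothetical, not part of this diff):

```python
# Sketch of the chatting_with_buffer cooldown, assuming the simplified rule
# described in the diff's comments: decrement all cooldowns except the active
# chat partner's each step; a chat may start only once the cooldown expires.

def decrement_chat_buffers(chatting_with, buffer):
    """Decrement every role's cooldown except the active chat partner's."""
    return {
        name: count - 1 if name != chatting_with else count
        for name, count in buffer.items()
    }


def may_talk_to(target, buffer):
    """A new chat with `target` may start only when its cooldown is spent."""
    return buffer.get(target, 0) <= 0
```

For example, with `chatting_with = "Klaus"` and a buffer of `{"Klaus": 800, "Maria": 1}`, one step leaves Klaus at 800 and Maria at 0, so a chat with Maria can start again while Klaus is still blocked.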