Optimize code structure
Signed-off-by: Jael Gu <mengjia.gu@zilliz.com>
jaelgu committed Nov 17, 2023
1 parent 40edc67 commit cfec748
Showing 80 changed files with 60 additions and 107 deletions.
3 changes: 1 addition & 2 deletions .github/workflows/pylint.yml
@@ -21,6 +21,5 @@ jobs:
- name: Python pylint
run: |
pip install pylint==2.10.2
pylint --rcfile=.pylintrc --output-format=colorized src_towhee
pylint --rcfile=.pylintrc --output-format=colorized src_langchain
pylint --rcfile=.pylintrc --output-format=colorized src
pylint --rcfile=.pylintrc --output-format=colorized offline_tools
3 changes: 3 additions & 0 deletions .gitignore
@@ -1,2 +1,5 @@
**/__pycache__
**/tmp
**/*.egg-info
**/*.db
**/build
4 changes: 2 additions & 2 deletions Contributing.md
@@ -65,8 +65,8 @@ If you're interested in contributing to the `zilliztech/akcio` codebase, follow
4. During development, you might want to run `pylint`. You can do so with one of the commands below:
```bash
$ pip install pylint==2.10.2
$ pylint --rcfile=.pylintrc --output-format=colorized src_towhee
$ pylint --rcfile=.pylintrc --output-format=colorized src_langchain
$ pylint --rcfile=.pylintrc --output-format=colorized src.towhee
$ pylint --rcfile=.pylintrc --output-format=colorized src.langchain
$ pylint --rcfile=.pylintrc --output-format=colorized offline_tools
```

20 changes: 10 additions & 10 deletions README.md
@@ -71,34 +71,34 @@ It also supports different integrations of LLM service and databases:

The option using Towhee simplifies the process of building a system by providing [pre-defined pipelines](https://towhee.io/tasks/pipeline). These built-in pipelines require less coding and make system building much easier. If you require customization, you can either simply modify configuration or create your own pipeline with rich options of [Towhee Operators](https://towhee.io/tasks/operator).
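For illustration only, a minimal sketch of what running one of Towhee's pre-defined pipelines looks like; the pipeline name `sentence_embedding` is taken from Towhee's public pipeline catalog and is not specific to this project:

```python
# Minimal sketch (assumes towhee>=1.1.0 is installed); 'sentence_embedding'
# is a built-in Towhee pipeline name used here purely as an example.
from towhee import AutoPipes

embedding_pipeline = AutoPipes.pipeline('sentence_embedding')
result = embedding_pipeline('How does Akcio build its knowledge base?')
print(result.get())  # the embedding produced by the pipeline
```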

- [Pipelines](./src_towhee/pipelines)
- [Pipelines](./src.towhee/pipelines)
- **Insert:**
The insert pipeline builds a knowledge base by saving documents and corresponding data in database(s).
- **Search:**
The search pipeline enables the question-answering capability powered by information retrieval (semantic search and optional keyword match) and LLM service.
- **Prompt:** a prompt operator prepares messages for LLM by assembling system message, chat history, and the user's query processed by template.

- [Memory](./src_towhee/memory):
The memory storage stores chat history to support context in conversation. (available: [most SQL](./src_towhee/memory/sql.py))
- [Memory](./src.towhee/memory):
The memory storage stores chat history to support context in conversation. (available: [most SQL](./src.towhee/memory/sql.py))


### Option 2: LangChain

The option using LangChain employs the use of [Agent](https://python.langchain.com/docs/modules/agents) in order to enable LLM to utilize specific tools, resulting in a greater demand for LLM's ability to comprehend tasks and make informed decisions.
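As a rough sketch of how these pieces compose (the retrieval tool below is a hypothetical placeholder; the `ChatAgent`/`AgentExecutor` calls mirror the usage visible in the test diffs further down):

```python
# Sketch only: wire the project's ChatAgent into a LangChain AgentExecutor.
# `lookup_docs` is a hypothetical placeholder tool, and the ChatLLM/ChatAgent
# argument names are assumed from the examples elsewhere in this repository.
from langchain.agents import AgentExecutor, Tool

from src.langchain.agent import ChatAgent
from src.langchain.llm.openai_chat import ChatLLM

def lookup_docs(query: str) -> str:
    """Placeholder retrieval tool; a real deployment would query the vector store."""
    return 'retrieved context for: ' + query

llm = ChatLLM(openai_api_key='sk-...')  # placeholder key
tools = [Tool(name='Search', func=lookup_docs, description='Retrieve project documents.')]
agent = ChatAgent.from_llm_and_tools(llm=llm, tools=tools)
agent_chain = AgentExecutor.from_agent_and_tools(agent=agent, tools=tools)
answer = agent_chain.run(input='What is Akcio?', chat_history=[])
```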

- [Agent](./src_langchain/agent)
- [Agent](./src.langchain/agent)
- **ChatAgent:** agent ensembles all modules together to build up qa system.
- Other agents (todo)
- [LLM](./src_langchain/llm)
- [LLM](./src.langchain/llm)
- **ChatLLM:** large language model or service to generate answers.
- [Embedding](./src_langchain/embedding/)
- [Embedding](./src.langchain/embedding/)
- **TextEncoder:** encoder converts each text input to a vector.
- Other encoders (todo)
- [Store](./src_langchain/store)
- [Store](./src.langchain/store)
- **VectorStore:** vector database stores document chunks in embeddings, and performs document retrieval via semantic search.
- **ScalarStore:** optional, database stores metadata for each document chunk, which supports additional information retrieval. (available: [Elastic](src_langchain/store/scalar_store/es.py))
- **ScalarStore:** optional, database stores metadata for each document chunk, which supports additional information retrieval. (available: [Elastic](src.langchain/store/scalar_store/es.py))
- **MemoryStore:** memory storage stores chat history to support context in conversation.
- [DataLoader](./src_langchain/data_loader/)
- [DataLoader](./src.langchain/data_loader/)
- **DataParser:** tool loads data from given source and then splits documents into processed doc chunks.

## Deployment
@@ -228,7 +228,7 @@ The option using LangChain employs the use of [Agent](https://python.langchain.c

## Load data

The `insert` function in [operations](./src_langchain/operations.py) loads project data from url(s) or file(s).
The `insert` function in [operations](./src.langchain/operations.py) loads project data from url(s) or file(s).
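A hypothetical usage sketch follows; the parameter names and return value of `insert` are assumptions for illustration and may differ from the actual function:

```python
# Hypothetical sketch: parameter names (data_src, project) and the returned
# chunk count are assumptions, not the verified signature.
from src.langchain.operations import insert

count = insert(data_src='https://towhee.io', project='akcio_demo')
print(f'Inserted {count} document chunks into project "akcio_demo".')
```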

There are 2 options to load project data:

10 changes: 5 additions & 5 deletions config.py
@@ -115,7 +115,7 @@
raise NotImplementedError

RERANK_CONFIG = {
'rerank': True, # or False
'rerank': False, # or False
'rerank_model': rerank_model,
'threshold': 0.0,
'rerank_device': -1 # -1 will use cpu
@@ -126,7 +126,7 @@
'chunk_size': 300
}

QUESTIONGENERATOR_CONFIG = {
'model_name': 'gpt-3.5-turbo',
'temperature': 0,
}
# QUESTIONGENERATOR_CONFIG = {
# 'model_name': 'gpt-3.5-turbo',
# 'temperature': 0,
# }
File renamed without changes.
4 changes: 2 additions & 2 deletions gradio_demo.py
@@ -17,9 +17,9 @@
'The service should start with either "--langchain" or "--towhee".'

if USE_LANGCHAIN:
from src_langchain.operations import chat, insert, check, drop, get_history, clear_history, count # pylint: disable=C0413
from src.langchain.operations import chat, insert, check, drop, get_history, clear_history, count # pylint: disable=C0413
if USE_TOWHEE:
from src_towhee.operations import chat, insert, check, drop, get_history, clear_history, count # pylint: disable=C0413
from src.towhee.operations import chat, insert, check, drop, get_history, clear_history, count # pylint: disable=C0413


def create_session_id():
4 changes: 2 additions & 2 deletions main.py
@@ -40,10 +40,10 @@
'The service should start with either "--langchain" or "--towhee".'

if USE_LANGCHAIN:
from src_langchain.operations import chat, insert, drop, check, get_history, clear_history, count # pylint: disable=C0413
from src.langchain.operations import chat, insert, drop, check, get_history, clear_history, count # pylint: disable=C0413
chat = partial(chat, enable_agent=ENABLE_AGENT)
if USE_TOWHEE:
from src_towhee.operations import chat, insert, drop, check, get_history, clear_history, count # pylint: disable=C0413
from src.towhee.operations import chat, insert, drop, check, get_history, clear_history, count # pylint: disable=C0413
if ENABLE_MONITER:
from moniter import enable_moniter # pylint: disable=C0413
from prometheus_client import generate_latest, REGISTRY # pylint: disable=C0413
2 changes: 1 addition & 1 deletion offline_tools/insert.py
@@ -7,7 +7,7 @@

sys.path.append(os.path.join(os.path.dirname(__file__), '..'))

from src_langchain.embedding import TextEncoder # pylint: disable=C0413
from src.langchain.embedding import TextEncoder # pylint: disable=C0413
from offline_tools.generator_questions import get_output_csv # pylint: disable=C0413
from offline_tools.utils.stackoverflow_json2csv import stackoverflow_json2csv # pylint: disable=C0413
from offline_tools.utils.load_npy import langchain_load # pylint: disable=C0413
2 changes: 1 addition & 1 deletion offline_tools/utils/load_npy.py
@@ -5,7 +5,7 @@

sys.path.append(os.path.join(os.path.dirname(__file__), '..'))

from src_langchain.store import DocStore # pylint: disable=C0413
from src.langchain.store import DocStore # pylint: disable=C0413


class DBReader(object):
1 change: 1 addition & 0 deletions requirements.txt
@@ -9,6 +9,7 @@ gradio>=3.30.0
fastapi
uvicorn
towhee>=1.1.0
pydantic<2.0
pymilvus
elasticsearch>=8.0.0
prometheus-client
File renamed without changes.
File renamed without changes.
Original file line number Diff line number Diff line change
@@ -47,8 +47,7 @@ agent = ChatAgent.from_llm_and_tools(
# Define a chain
agent_chain = AgentExecutor.from_agent_and_tools(
agent=agent,
tools=tools,
verbose=False
tools=tools
)

# Run a test
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
Original file line number Diff line number Diff line change
@@ -43,7 +43,6 @@ def chat(session_id, project, question, enable_agent=False):
agent=agent,
tools=tools,
memory=memory_db.memory,
verbose=False
)
try:
final_answer = agent_chain.run(input=question)
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
2 changes: 1 addition & 1 deletion src_towhee/memory/sql.py → src/towhee/memory/sql.py
@@ -8,7 +8,7 @@

sys.path.append(os.path.join(os.path.dirname(__file__), '../..'))

from src_towhee.base import BaseMemory # pylint: disable=C0413
from src.towhee.base import BaseMemory # pylint: disable=C0413
from config import MEMORYDB_CONFIG # pylint: disable=C0413


4 changes: 2 additions & 2 deletions src_towhee/operations.py → src/towhee/operations.py
@@ -4,8 +4,8 @@

sys.path.append(os.path.join(os.path.dirname(__file__), '..'))

from src_towhee.pipelines import TowheePipelines # pylint: disable=C0413
from src_towhee.memory import MemoryStore # pylint: disable=C0413
from src.towhee.pipelines import TowheePipelines # pylint: disable=C0413
from src.towhee.memory import MemoryStore # pylint: disable=C0413


logger = logging.getLogger(__name__)
File renamed without changes.
Original file line number Diff line number Diff line change
@@ -14,9 +14,9 @@
RERANK_CONFIG, QUERY_MODE, INSERT_MODE,
DATAPARSER_CONFIG
)
from src_towhee.base import BasePipelines # pylint: disable=C0413
from src_towhee.pipelines.search import build_search_pipeline # pylint: disable=C0413
from src_towhee.pipelines.insert import build_insert_pipeline # pylint: disable=C0413
from src.towhee.base import BasePipelines # pylint: disable=C0413
from src.towhee.pipelines.search import build_search_pipeline # pylint: disable=C0413
from src.towhee.pipelines.insert import build_insert_pipeline # pylint: disable=C0413


class TowheePipelines(BasePipelines):
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
Original file line number Diff line number Diff line change
@@ -1,13 +1,8 @@
import os
import sys
import unittest

from langchain.agents import AgentExecutor, Tool
from langchain.llms.fake import FakeListLLM

sys.path.append(os.path.join(os.path.dirname(__file__), '../../../..'))

from src_langchain.agent import ChatAgent
from src.langchain.agent import ChatAgent


class TestChatAgent(unittest.TestCase):
@@ -25,8 +20,7 @@ class TestChatAgent(unittest.TestCase):
def test_run_chat_agent(self):
agent_executor = AgentExecutor.from_agent_and_tools(
agent=self.chat_agent,
tools=self.tools,
verbose=False
tools=self.tools
)
final_answer = agent_executor.run(input='whats 2 + 2', chat_history=[])
assert final_answer == self.responses[1]
Original file line number Diff line number Diff line change
@@ -1,13 +1,8 @@
import os
import sys
import unittest

from langchain.schema import AgentAction, AgentFinish

sys.path.append(os.path.join(os.path.dirname(__file__), '../../../..'))

from src_langchain.agent.prompt import FORMAT_INSTRUCTIONS
from src_langchain.agent.output_parser import OutputParser
from src.langchain.agent.prompt import FORMAT_INSTRUCTIONS
from src.langchain.agent.output_parser import OutputParser


class TestOutputParser(unittest.TestCase):
File renamed without changes.
Original file line number Diff line number Diff line change
@@ -1,16 +1,13 @@
import io
import os
import sys
import tempfile
import unittest
from unittest.mock import patch

from langchain.schema import Document
from langchain.text_splitter import RecursiveCharacterTextSplitter

sys.path.append(os.path.join(os.path.dirname(__file__), '../../../..'))

from src_langchain.data_loader import DataParser
from src.langchain.data_loader import DataParser


class TestDataParser(unittest.TestCase):
Original file line number Diff line number Diff line change
@@ -1,10 +1,6 @@
import os
import sys
import unittest

sys.path.append(os.path.join(os.path.dirname(__file__), '../../../..'))

from src_langchain.data_loader.data_splitter import MarkDownSplitter
from src.langchain.data_loader.data_splitter import MarkDownSplitter


class TestMarkDownSplitter(unittest.TestCase):
Original file line number Diff line number Diff line change
@@ -1,12 +1,8 @@
import os
import sys
import unittest
from unittest.mock import patch

import numpy as np

sys.path.append(os.path.join(os.path.dirname(__file__), '../../../../..'))
from src_langchain.embedding.langchain_huggingface import TextEncoder
from src.langchain.embedding.langchain_huggingface import TextEncoder


class TestLangchainHuggingface(unittest.TestCase):
Original file line number Diff line number Diff line change
@@ -1,12 +1,8 @@
import os
import sys
import unittest
from unittest.mock import patch

import numpy as np

sys.path.append(os.path.join(os.path.dirname(__file__), '../../../../..'))
from src_langchain.embedding.openai_embedding import TextEncoder
from src.langchain.embedding.openai_embedding import TextEncoder


class TestOpenAIEmbedding(unittest.TestCase):
Original file line number Diff line number Diff line change
@@ -1,11 +1,8 @@
import os
import sys
import unittest
from unittest.mock import patch

from langchain.schema import HumanMessage

sys.path.append(os.path.join(os.path.dirname(__file__), '../../../../..'))

MOCK_ANSWER = 'mock answer'

@@ -18,7 +15,7 @@ def __call__(self, prompt):

with patch('transformers.pipeline') as mock_pipelines:
mock_pipelines.return_value = MockGenerateText()
from src_langchain.llm.dolly_chat import ChatLLM
from src.langchain.llm.dolly_chat import ChatLLM

chat_llm = ChatLLM(model_name='mock', device='cpu', )
messages = [HumanMessage(content='hello')]
Original file line number Diff line number Diff line change
@@ -1,11 +1,7 @@
import os
import sys
import unittest
from unittest.mock import patch
from langchain.schema import HumanMessage, AIMessage

sys.path.append(os.path.join(os.path.dirname(__file__), '../../../..'))


class TestERNIE(unittest.TestCase):
def test_generate(self):
@@ -27,7 +23,7 @@ def test_generate(self):
)
mock_post.return_value = mock_res

from src_langchain.llm.ernie import ChatLLM
from src.langchain.llm.ernie import ChatLLM

EB_API_TYPE = 'mock_type'
EB_ACCESS_TOKEN = 'mock_token'
Original file line number Diff line number Diff line change
@@ -1,13 +1,9 @@
import os
import sys
import unittest

sys.path.append(os.path.join(os.path.dirname(__file__), '../../../../..'))


class TestOpenAIChat(unittest.TestCase):
def test_init(self):
from src_langchain.llm.openai_chat import ChatLLM
from src.langchain.llm.openai_chat import ChatLLM
chat_llm = ChatLLM(openai_api_key='mock-key')
self.assertEqual(chat_llm.__class__.__name__, 'ChatLLM')

Empty file.
1 change: 1 addition & 0 deletions tests/unit_tests/src/towhee/akcio_ut.txt
@@ -0,0 +1 @@
This is test content.
Empty file.
Original file line number Diff line number Diff line change
@@ -1,11 +1,8 @@
import os
import sys
import unittest

sys.path.append(os.path.join(os.path.dirname(__file__), '../../../..'))

from src_towhee.base import BaseMemory # pylint: disable=C0413
from src_towhee.memory.sql import MemoryStore # pylint: disable=C0413
from src.towhee.base import BaseMemory
from src.towhee.memory.sql import MemoryStore


class TestSql(unittest.TestCase):
Empty file.
Original file line number Diff line number Diff line change
@@ -1,19 +1,15 @@
import unittest
from unittest.mock import patch

import json
import sys
import os

from milvus import MilvusServer

sys.path.append(os.path.join(os.path.dirname(__file__), '../../../..'))

from config import ( # pylint: disable=C0413
CHAT_CONFIG, TEXTENCODER_CONFIG,
VECTORDB_CONFIG, RERANK_CONFIG,
)
from src_towhee.pipelines import TowheePipelines # pylint: disable=C0413
from src.towhee.pipelines import TowheePipelines # pylint: disable=C0413

milvus_server = MilvusServer()

