diff --git a/.gitignore b/.gitignore
index 4c503a3..c982df7 100644
--- a/.gitignore
+++ b/.gitignore
@@ -159,3 +159,5 @@ cython_debug/
 # and can be added to the global gitignore or merged into this file. For a more nuclear
 # option (not recommended) you can uncomment the following to ignore the entire idea folder.
 #.idea/
+
+.cosine
\ No newline at end of file
diff --git a/agent/src/og_agent/agent_api_server.py b/agent/src/og_agent/agent_api_server.py
index e62e62a..f28b25a 100644
--- a/agent/src/og_agent/agent_api_server.py
+++ b/agent/src/og_agent/agent_api_server.py
@@ -178,10 +178,13 @@ class TaskRequest(BaseModel):
 
 
 async def run_task(task: TaskRequest, key):
-    async for respond in agent_sdk.prompt(task.prompt, key, files=task.input_files, context_id=task.context_id):
+    async for respond in agent_sdk.prompt(
+        task.prompt, key, files=task.input_files, context_id=task.context_id
+    ):
         response = StepResponse.new_from(respond).model_dump(exclude_none=True)
         yield "data: %s\n" % json.dumps(response)
 
+
 @app.post("/process")
 async def process_task(
     task: TaskRequest,
diff --git a/agent/src/og_agent/base_agent.py b/agent/src/og_agent/base_agent.py
index 97a8286..117315d 100644
--- a/agent/src/og_agent/base_agent.py
+++ b/agent/src/og_agent/base_agent.py
@@ -63,6 +63,7 @@ class TypingState:
     MESSAGE = 4
     OTHER = 5
 
+
 class BaseAgent:
 
     def __init__(self, sdk):
@@ -70,7 +71,9 @@ def __init__(self, sdk):
         self.model_name = ""
         self.agent_memories = {}
 
-    def create_new_memory_with_default_prompt(self, user_name, user_id, actions = ACTIONS):
+    def create_new_memory_with_default_prompt(
+        self, user_name, user_id, actions=ACTIONS
+    ):
         """
         create a new memory for the user
         """
@@ -386,7 +389,6 @@ async def extract_message(
                 response_token_count + context_output_token_count
             )
             if is_json_format:
-
                 (
                     new_text_content,
                     new_code_content,
diff --git a/agent/src/og_agent/llama_agent.py b/agent/src/og_agent/llama_agent.py
index 87c412b..7c2652c 100644
--- a/agent/src/og_agent/llama_agent.py
+++ b/agent/src/og_agent/llama_agent.py
@@ -36,51 +36,6 @@ def _output_exception(self):
             "Sorry, the LLM did return nothing, You can use a better performance model"
         )
 
-
-    def _format_output(self, json_response):
-        """
-        format the response and send it to the user
-        """
-        answer = json_response["explanation"]
-        if json_response["action"] == "no_action":
-            return answer
-        elif json_response["action"] == "show_sample_code":
-            return ""
-        else:
-            code = json_response.get("code", None)
-            answer_code = """%s
-```%s
-%s
-```
-""" % (
-                answer,
-                json_response.get("language", "python"),
-                code if code else "",
-            )
-            return answer_code
-
-    async def handle_show_sample_code(
-        self, json_response, queue, context, task_context
-    ):
-        code = json_response["code"]
-        explanation = json_response["explanation"]
-        saved_filenames = json_response.get("saved_filenames", [])
-        tool_input = json.dumps({
-            "code": code,
-            "explanation": explanation,
-            "saved_filenames": saved_filenames,
-            "language": json_response.get("language", "text"),
-        })
-        await queue.put(
-            TaskResponse(
-                state=task_context.to_context_state_proto(),
-                response_type=TaskResponse.OnStepActionStart,
-                on_step_action_start=OnStepActionStart(
-                    input=tool_input, tool="show_sample_code"
-                ),
-            )
-        )
-
     async def handle_bash_code(
         self, json_response, queue, context, task_context, task_opt
     ):
@@ -130,7 +85,7 @@ async def handle_python_function(
                 state=task_context.to_context_state_proto(),
                 response_type=TaskResponse.OnStepActionStart,
                 on_step_action_start=OnStepActionStart(
-                    input=tool_input, tool='execute'
+                    input=tool_input, tool="execute"
                 ),
             )
         )
@@ -176,10 +131,10 @@ async def arun(self, request, queue, context, task_opt):
         context_id = (
             request.context_id
             if request.context_id
-            else self.create_new_memory_with_default_prompt("", "", actions=[FUNCTION_EXECUTE,
-                FUNCTION_DIRECT_MESSAGE])
+            else self.create_new_memory_with_default_prompt(
+                "", "", actions=[FUNCTION_EXECUTE, FUNCTION_DIRECT_MESSAGE]
+            )
         )
-
         if context_id not in self.agent_memories:
             await queue.put(
                 TaskResponse(
@@ -190,7 +145,6 @@ async def arun(self, request, queue, context, task_opt):
                 )
             )
             return
-
         agent_memory = self.agent_memories[context_id]
         agent_memory.update_options(self.memory_option)
         agent_memory.append_chat_message(
@@ -253,7 +207,8 @@ async def arun(self, request, queue, context, task_opt):
                 break
             logger.debug(f" llama response {json_response}")
             if (
-                'function_call'in json_response and json_response["function_call"] == "execute"
+                "function_call" in json_response
+                and json_response["function_call"] == "execute"
             ):
                 agent_memory.append_chat_message(message)
                 tools_mapping = {
@@ -261,8 +216,14 @@ async def arun(self, request, queue, context, task_opt):
                     "python": self.handle_python_function,
                    "bash": self.handle_bash_code,
                 }
-                function_result = await tools_mapping[json_response["arguments"]['language']](
-                    json_response['arguments'], queue, context, task_context, task_opt
+                function_result = await tools_mapping[
+                    json_response["arguments"]["language"]
+                ](
+                    json_response["arguments"],
+                    queue,
+                    context,
+                    task_context,
+                    task_opt,
                 )
 
                 logger.debug(f"the function result {function_result}")
@@ -287,23 +248,31 @@ async def arun(self, request, queue, context, task_opt):
                         "role": "user",
                         "content": f"{action_output} \n {function_result.console_stdout}",
                     })
-                    agent_memory.append_chat_message({"role": "user", "content": current_question})
+                    agent_memory.append_chat_message(
+                        {"role": "user", "content": current_question}
+                    )
                 elif function_result.has_error:
                     agent_memory.append_chat_message({
                         "role": "user",
                         "content": f"{action_output} \n {function_result.console_stderr}",
                     })
                     current_question = f"Generate a new step to fix the above error"
-                    agent_memory.append_chat_message({"role": "user", "content": current_question})
+                    agent_memory.append_chat_message(
+                        {"role": "user", "content": current_question}
+                    )
                 else:
                     agent_memory.append_chat_message({
                         "role": "user",
                         "content": f"{action_output} \n {function_result.console_stdout}",
                     })
-                    agent_memory.append_chat_message({
-                        "role": "user", "content": current_question})
+                    agent_memory.append_chat_message(
+                        {"role": "user", "content": current_question}
+                    )
-            elif 'function_call' in json_response and json_response["function_call"] == "direct_message":
-                message = json_response['arguments']['message']
+            elif (
+                "function_call" in json_response
+                and json_response["function_call"] == "direct_message"
+            ):
+                message = json_response["arguments"]["message"]
                 await queue.put(
                     TaskResponse(
                         state=task_context.to_context_state_proto(),
diff --git a/agent/src/og_agent/llama_client.py b/agent/src/og_agent/llama_client.py
index 234f247..465ab19 100644
--- a/agent/src/og_agent/llama_client.py
+++ b/agent/src/og_agent/llama_client.py
@@ -20,7 +20,7 @@ def __init__(self, endpoint, key, grammar):
         super().__init__(endpoint + "/v1/chat/completions", key)
         self.grammar = grammar
 
-    async def chat(self, messages, model, temperature=0, max_tokens=1024, stop=[]):
+    async def chat(self, messages, model, temperature=0, max_tokens=1024, stop=["\n"]):
         data = {
             "messages": messages,
             "temperature": temperature,
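A note on the `chat` signature in the llama_client.py hunk above: both the old `stop=[]` and the new `stop=["\n"]` are mutable default arguments, which Python evaluates once at function definition time and then shares across every call. That only becomes a bug if the list is ever mutated, but the `None`-default idiom avoids the hazard entirely. A minimal sketch of that idiom (the helper name `build_chat_payload` is hypothetical, and the real method builds more request fields than this hunk shows):

```python
def build_chat_payload(messages, temperature=0, max_tokens=1024, stop=None):
    """Build a chat request body with a per-call default stop list."""
    if stop is None:
        stop = ["\n"]  # fresh list on every call, never shared between callers
    return {
        "messages": messages,
        "temperature": temperature,
        "max_tokens": max_tokens,
        "stop": stop,
    }
```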
diff --git a/agent/src/og_agent/prompt.py b/agent/src/og_agent/prompt.py
index 82b6a15..9ba4b77 100644
--- a/agent/src/og_agent/prompt.py
+++ b/agent/src/og_agent/prompt.py
@@ -17,52 +17,50 @@
     "Use `execute` action to execute any code and `direct_message` action to send message to user",
 ]
 
-FUNCTION_EXECUTE= ActionDesc(
-        name="execute",
-        desc="This action executes code in your programming environment and returns the output",
-        parameters=json.dumps({
-            "type": "object",
-            "properties": {
-                "explanation": {
-                    "type": "string",
-                    "description": "the explanation about the code parameters",
-                },
-                "code": {
-                    "type": "string",
-                    "description": "the bash code to be executed",
-                },
-                "language": {
-                    "type": "string",
-                    "description": "the language of the code, only python and bash are supported",
-                },
-                "saved_filenames": {
-                    "type": "array",
-                    "items": {"type": "string"},
-                    "description": "A list of filenames that were created by the code",
-                },
-            },
-            "required": ["explanation", "code", "language"],
-        }),
-    )
+FUNCTION_EXECUTE = ActionDesc(
+    name="execute",
+    desc="This action executes code in your programming environment and returns the output",
+    parameters=json.dumps({
+        "type": "object",
+        "properties": {
+            "explanation": {
+                "type": "string",
+                "description": "the explanation about the code parameters",
+            },
+            "code": {
+                "type": "string",
+                "description": "the bash code to be executed",
+            },
+            "language": {
+                "type": "string",
+                "description": "the language of the code, only python and bash are supported",
+            },
+            "saved_filenames": {
+                "type": "array",
+                "items": {"type": "string"},
+                "description": "A list of filenames that were created by the code",
+            },
+        },
+        "required": ["explanation", "code", "language"],
+    }),
+)
 
-FUNCTION_DIRECT_MESSAGE= ActionDesc(
-        name="direct_message",
-        desc="This action sends a direct message to user.",
-        parameters=json.dumps({
-            "type": "object",
-            "properties": {
-                "message": {
-                    "type": "string",
-                    "description": "the message will be sent to user",
-                },
-            },
-            "required": ["message"],
-        }),
+FUNCTION_DIRECT_MESSAGE = ActionDesc(
+    name="direct_message",
+    desc="This action sends a direct message to user.",
+    parameters=json.dumps({
+        "type": "object",
+        "properties": {
+            "message": {
+                "type": "string",
+                "description": "the message will be sent to user",
+            },
+        },
+        "required": ["message"],
+    }),
 )
 
-ACTIONS = [
-    FUNCTION_EXECUTE
-]
+ACTIONS = [FUNCTION_EXECUTE]
 OUTPUT_FORMAT = """The output format must be a JSON format with the following fields:
 * function_call: The name of the action
 * arguments: The arguments of the action
diff --git a/agent/tests/openai_agent_tests.py b/agent/tests/openai_agent_tests.py
index f353899..9013190 100644
--- a/agent/tests/openai_agent_tests.py
+++ b/agent/tests/openai_agent_tests.py
@@ -158,7 +158,6 @@ async def test_openai_agent_call_execute_bash_code(mocker, kernel_sdk):
     assert console_output[0].console_stdout == "hello world\n", "bad console output"
 
 
-
 @pytest.mark.asyncio
 async def test_openai_agent_call_execute_python_code(mocker, kernel_sdk):
     kernel_sdk.connect()
diff --git a/agent/tests/tokenizer_test.py b/agent/tests/tokenizer_test.py
new file mode 100644
index 0000000..3540d7d
--- /dev/null
+++ b/agent/tests/tokenizer_test.py
@@ -0,0 +1,20 @@
+# vim:fenc=utf-8
+
+# SPDX-FileCopyrightText: 2023 imotai
+# SPDX-FileContributor: imotai
+#
+# SPDX-License-Identifier: Elastic-2.0
+
+""" """
+
+import logging
+import io
+from og_agent.tokenizer import tokenize
+
+logger = logging.getLogger(__name__)
+
+
+def test_parse_explanation():
"""{"function_call":"execute", "arguments": {"explanation":"h""" + for token_state, token in tokenize(io.StringIO(arguments)): + logger.info(f"token_state: {token_state}, token: {token}") diff --git a/roles/README.md b/roles/README.md new file mode 100644 index 0000000..2bbb978 --- /dev/null +++ b/roles/README.md @@ -0,0 +1 @@ +# the role module diff --git a/roles/setup.py b/roles/setup.py new file mode 100644 index 0000000..032689a --- /dev/null +++ b/roles/setup.py @@ -0,0 +1,26 @@ +# Copyright (C) 2023 dbpunk.com Author imotai +# SPDX-FileCopyrightText: 2023 imotai +# SPDX-FileContributor: imotai +# +# SPDX-License-Identifier: Elastic-2.0 + +""" """ +from setuptools import setup, find_packages + +setup( + name="og_roles", + version="0.3.6", + description="Open source llm agent service", + author="imotai", + author_email="wangtaize@dbpunk.com", + url="https://github.com/dbpunk-labs/octogen", + long_description=open("README.md").read(), + long_description_content_type="text/markdown", + packages=[ + "og_roles", + ], + package_dir={ + "og_roles": "src/og_roles", + }, + package_data={}, +) diff --git a/roles/src/og_roles/__init__.py b/roles/src/og_roles/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/roles/src/og_roles/code_interpreter.py b/roles/src/og_roles/code_interpreter.py new file mode 100644 index 0000000..c3727cd --- /dev/null +++ b/roles/src/og_roles/code_interpreter.py @@ -0,0 +1,77 @@ +# vim:fenc=utf-8 + +# SPDX-FileCopyrightText: 2023 imotai +# SPDX-FileContributor: imotai +# +# SPDX-License-Identifier: Elastic-2.0 + +""" + +""" +import json +from og_proto.prompt_pb2 import ActionDesc + + +ROLE = f"""You are the Programming Copilot, a world-class programmer to complete any goal by executing code""" +RULES = [ + "To complete the goal, write a plan and execute it step-by-step, limiting the number of steps to five", + "Every step must include the explanation and the code block. 
+    "You have a fully controlled programming environment to execute code with internet connection but sudo is not allowed",
+    "You must try to correct your code when you get errors from the output",
+    "You can install new package with pip",
+    "Use `execute` action to execute any code and `direct_message` action to send message to user",
+]
+FUNCTION_EXECUTE= ActionDesc(
+        name="execute",
+        desc="This action executes code in your programming environment and returns the output",
+        parameters=json.dumps({
+            "type": "object",
+            "properties": {
+                "explanation": {
+                    "type": "string",
+                    "description": "the explanation about the code parameters",
+                },
+                "code": {
+                    "type": "string",
+                    "description": "the bash code to be executed",
+                },
+                "language": {
+                    "type": "string",
+                    "description": "the language of the code, only python and bash are supported",
+                },
+                "saved_filenames": {
+                    "type": "array",
+                    "items": {"type": "string"},
+                    "description": "A list of filenames that were created by the code",
+                },
+            },
+            "required": ["explanation", "code", "language"],
+        }),
+    )
+
+FUNCTION_DIRECT_MESSAGE= ActionDesc(
+        name="direct_message",
+        desc="This action sends a direct message to user.",
+        parameters=json.dumps({
+            "type": "object",
+            "properties": {
+                "message": {
+                    "type": "string",
+                    "description": "the message will be sent to user",
+                },
+            },
+            "required": ["message"],
+        }),
+)
+ACTIONS = [
+    FUNCTION_EXECUTE
+]
+OUTPUT_FORMAT = """The output format must be a JSON format with the following fields:
+* function_call: The name of the action
+* arguments: The arguments of the action
+"""
+
+OCTOGEN_CODELLAMA_MID_INS = """The above output of the %s determines whether the execution is successful.
+If successful, go to the next step. If the current step is the final step, summarize the entire plan. If not, adjust the input and try again"""
+
+OCTOGEN_CODELLAMA_MID_ERROR_INS = """Adjust the action input and try again for the above output of %s showing the error message"""
diff --git a/sdk/src/og_sdk/agent_sdk.py b/sdk/src/og_sdk/agent_sdk.py
index 17595cc..23e68ba 100644
--- a/sdk/src/og_sdk/agent_sdk.py
+++ b/sdk/src/og_sdk/agent_sdk.py
@@ -186,7 +186,9 @@ async def prompt(self, prompt, api_key, files=[], context_id=None):
 
         metadata = aio.Metadata(
             ("api_key", api_key),
         )
-        request = agent_server_pb2.ProcessTaskRequest(task=prompt, input_files=files, context_id=context_id)
+        request = agent_server_pb2.ProcessTaskRequest(
+            task=prompt, input_files=files, context_id=context_id
+        )
         async for respond in self.stub.process_task(request, metadata=metadata):
             yield respond
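Taken together, the `run_task` hunk in agent_api_server.py and the `AgentSDK.prompt` hunk above define the streaming path: the SDK yields one step response per gRPC message, and the API server frames each one as a `data: <json>` line. A minimal client-side decoder for that framing, assuming only what the hunks show (`parse_step_line` is our name for illustration, not part of the codebase):

```python
import json


def parse_step_line(line: str):
    """Decode one 'data: {...}' line as framed by run_task(); None otherwise."""
    prefix = "data: "
    line = line.rstrip("\n")
    if line.startswith(prefix):
        return json.loads(line[len(prefix):])
    return None


assert parse_step_line('data: {"step": 1}\n') == {"step": 1}
assert parse_step_line("event: ping\n") is None
```

One observation on the framing: strict Server-Sent Events terminates each event with a blank line, while `run_task` emits a single `\n` per event, so a consumer should split on newlines rather than rely on an off-the-shelf SSE parser.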