update README and format code

liangxinbing 2025-03-11 23:07:31 +08:00
parent 737abe4f90
commit 487b44fda8
7 changed files with 85 additions and 56 deletions

@@ -143,6 +143,9 @@ Join our networking group on Feishu and share your experience with other developers
 Thanks to [anthropic-computer-use](https://github.com/anthropics/anthropic-quickstarts/tree/main/computer-use-demo)
 and [browser-use](https://github.com/browser-use/browser-use) for providing basic support for this project!
+Additionally, we are grateful to [AAAJ](https://github.com/metauto-ai/agent-as-a-judge)
+and [MetaGPT](https://github.com/mannaandpoem/MetaGPT).
 OpenManus is built by contributors from MetaGPT. Huge thanks to this agent community!

 ## Cite

@@ -145,4 +145,7 @@ python run_flow.py
 Special thanks to [anthropic-computer-use](https://github.com/anthropics/anthropic-quickstarts/tree/main/computer-use-demo)
 and [browser-use](https://github.com/browser-use/browser-use) for providing foundational support for this project!
+Additionally, we thank [AAAJ](https://github.com/metauto-ai/agent-as-a-judge)
+and [MetaGPT](https://github.com/mannaandpoem/MetaGPT).
 OpenManus is built by contributors from the MetaGPT community. Thanks to this vibrant community of agent developers!

@@ -1,6 +1,6 @@
-from typing import Dict, List, Literal, Optional, Union, Tuple, Any
-import os
 import base64
+import os
+from typing import Any, Dict, List, Literal, Optional, Tuple, Union

 import litellm
 from litellm import completion, completion_cost
@@ -9,12 +9,17 @@ from litellm.exceptions import (
     RateLimitError,
     ServiceUnavailableError,
 )
-from tenacity import retry, stop_after_attempt, wait_random_exponential, retry_if_exception_type
+from tenacity import (
+    retry,
+    retry_if_exception_type,
+    stop_after_attempt,
+    wait_random_exponential,
+)

 from app.config import LLMSettings, config
+from app.llm.cost import Cost
 from app.logger import logger
 from app.schema import Message
-from app.llm.cost import Cost


 class LLM:
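The multi-line `tenacity` import above feeds a retry policy around the completion call. As a rough illustration of how those four names typically combine (the decorated function and the exception class here are hypothetical, not from this commit):

```python
from tenacity import (
    retry,
    retry_if_exception_type,
    stop_after_attempt,
    wait_random_exponential,
)


class TransientAPIError(Exception):
    """Hypothetical stand-in for provider errors like RateLimitError."""


@retry(
    retry=retry_if_exception_type(TransientAPIError),  # retry only transient failures
    stop=stop_after_attempt(6),  # give up after six attempts
    wait=wait_random_exponential(min=1, max=60),  # jittered exponential backoff
)
def call_model(prompt: str) -> str:
    # In the real class this would wrap litellm.completion(...).
    raise TransientAPIError("rate limited")
```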
@@ -32,7 +37,9 @@ class LLM:
     def __init__(
         self, config_name: str = "default", llm_config: Optional[LLMSettings] = None
     ):
-        if not hasattr(self, "initialized"):  # Only initialize if not already initialized
+        if not hasattr(
+            self, "initialized"
+        ):  # Only initialize if not already initialized
             llm_config = llm_config or config.llm
             llm_config = llm_config.get(config_name, llm_config["default"])
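The `hasattr(self, "initialized")` guard implies `__init__` can run more than once on the same object, i.e. the class hands back shared instances per configuration. A minimal sketch of that pattern, with hypothetical names:

```python
class LLM:
    _instances: dict = {}

    def __new__(cls, config_name: str = "default"):
        # Hand back one shared instance per configuration name.
        if config_name not in cls._instances:
            cls._instances[config_name] = super().__new__(cls)
        return cls._instances[config_name]

    def __init__(self, config_name: str = "default"):
        # __init__ runs on every call, so guard against re-initialization.
        if not hasattr(self, "initialized"):
            self.config_name = config_name
            self.initialized = True


assert LLM("default") is LLM("default")  # same object both times
```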
@@ -41,7 +48,9 @@ class LLM:
             self.temperature = getattr(llm_config, "temperature", 0.7)
             self.top_p = getattr(llm_config, "top_p", 0.9)
             self.api_type = getattr(llm_config, "api_type", "openai")
-            self.api_key = getattr(llm_config, "api_key", os.environ.get("OPENAI_API_KEY", ""))
+            self.api_key = getattr(
+                llm_config, "api_key", os.environ.get("OPENAI_API_KEY", "")
+            )
             self.api_version = getattr(llm_config, "api_version", "")
             self.base_url = getattr(llm_config, "base_url", "https://api.openai.com/v1")
             self.timeout = getattr(llm_config, "timeout", 60)
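Each setting falls back through `getattr`, and the API key additionally falls back to the `OPENAI_API_KEY` environment variable. A small sketch of that lookup order (the settings object here is a stand-in):

```python
import os
from types import SimpleNamespace

# Stand-in config without an api_key attribute.
llm_config = SimpleNamespace(model="gpt-4o", temperature=0.2)

# getattr's default kicks in only when the attribute is missing entirely.
api_key = getattr(llm_config, "api_key", os.environ.get("OPENAI_API_KEY", ""))
temperature = getattr(llm_config, "temperature", 0.7)  # present, so 0.2 wins

print(temperature, bool(api_key))
```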
@@ -183,7 +192,9 @@ class LLM:
             # Add the cost to our tracker
             if cost > 0:
                 self.cost_tracker.add_cost(cost)
-                logger.info(f"Added cost: ${cost:.6f}, Total: ${self.cost_tracker.accumulated_cost:.6f}")
+                logger.info(
+                    f"Added cost: ${cost:.6f}, Total: ${self.cost_tracker.accumulated_cost:.6f}"
+                )

             return cost
         except Exception as e:
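The `Cost` class imported from `app.llm.cost` is not shown in this diff; judging from the calls above it needs at least an `add_cost` method and an `accumulated_cost` attribute. A plausible minimal shape (an assumption, not the project's actual implementation):

```python
class Cost:
    """Accumulates per-request USD costs across calls."""

    def __init__(self) -> None:
        self.accumulated_cost: float = 0.0

    def add_cost(self, cost: float) -> None:
        if cost < 0:
            raise ValueError("cost must be non-negative")
        self.accumulated_cost += cost


tracker = Cost()
tracker.add_cost(0.000123)
print(f"Total: ${tracker.accumulated_cost:.6f}")
```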
@@ -202,7 +213,9 @@ class LLM:
             substring in self.base_url
             for substring in ["localhost", "127.0.0.1", "0.0.0.0"]
         )
-        if self.model and (self.model.startswith("ollama") or "local" in self.model.lower()):
+        if self.model and (
+            self.model.startswith("ollama") or "local" in self.model.lower()
+        ):
             return True
         return False
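Together, the two checks in this hunk treat a model as local when the base URL points at a loopback host or the model name looks Ollama-like. The same heuristic as a standalone function:

```python
def is_local_model(base_url: str, model: str) -> bool:
    # A loopback-style host means the endpoint is served locally.
    if any(host in base_url for host in ["localhost", "127.0.0.1", "0.0.0.0"]):
        return True
    # Ollama-prefixed or explicitly "local" model names also count.
    if model and (model.startswith("ollama") or "local" in model.lower()):
        return True
    return False


print(is_local_model("http://localhost:11434", "llama3"))     # True
print(is_local_model("https://api.openai.com/v1", "gpt-4o"))  # False
```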
@@ -234,7 +247,9 @@ class LLM:
         with open(image_path, "rb") as image_file:
             return base64.b64encode(image_file.read()).decode("utf-8")

-    def prepare_messages(self, text: str, image_path: Optional[str] = None) -> List[dict]:
+    def prepare_messages(
+        self, text: str, image_path: Optional[str] = None
+    ) -> List[dict]:
         """
         Prepare messages for completion, including multimodal content if needed.
@@ -257,7 +272,9 @@ class LLM:
             ]
         return messages

-    def do_multimodal_completion(self, text: str, image_path: str) -> Tuple[Any, float, float]:
+    def do_multimodal_completion(
+        self, text: str, image_path: str
+    ) -> Tuple[Any, float, float]:
         """
         Perform a multimodal completion with text and image.
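`prepare_messages` builds an OpenAI-style multimodal message when an image path is supplied: the base64-encoded file rides along as a data URL next to the text part. A self-contained sketch of that payload shape (the JPEG media type is an assumption):

```python
import base64
from typing import List, Optional


def prepare_messages(text: str, image_path: Optional[str] = None) -> List[dict]:
    if image_path is None:
        return [{"role": "user", "content": text}]
    with open(image_path, "rb") as image_file:
        b64 = base64.b64encode(image_file.read()).decode("utf-8")
    # OpenAI-style mixed content: one text part plus one image_url part.
    return [
        {
            "role": "user",
            "content": [
                {"type": "text", "text": text},
                {
                    "type": "image_url",
                    "image_url": {"url": f"data:image/jpeg;base64,{b64}"},
                },
            ],
        }
    ]
```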
@@ -342,7 +359,7 @@ class LLM:
                     print(chunk_message, end="", flush=True)

             # For streaming responses, cost is calculated on the last chunk
-            if hasattr(chunk, 'usage') and chunk.usage:
+            if hasattr(chunk, "usage") and chunk.usage:
                 self._calculate_and_track_cost(chunk)

             print()  # Newline after streaming
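As the comment notes, usage only arrives on the final streaming chunk, so cost can be computed only after the deltas have been printed. A sketch with litellm; passing `stream_options={"include_usage": True}` to request usage on the last chunk is an assumption about how the call is configured:

```python
from litellm import completion

response = completion(
    model="gpt-4o-mini",
    messages=[{"role": "user", "content": "Say hi"}],
    stream=True,
    stream_options={"include_usage": True},  # assumed: ask for usage on the last chunk
)

for chunk in response:
    # The final usage chunk has an empty choices list, so guard the access.
    delta = chunk.choices[0].delta.content if chunk.choices else None
    if delta:
        print(delta, end="", flush=True)
    if hasattr(chunk, "usage") and chunk.usage:
        print(f"\nTotal tokens: {chunk.usage.total_tokens}")
```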
@@ -484,6 +501,7 @@ class LLM:
 if __name__ == "__main__":
     # Load environment variables if needed
     from dotenv import load_dotenv
+
     load_dotenv()

     # Create LLM instance
@@ -501,5 +519,7 @@ if __name__ == "__main__":
     multimodal_response, mm_cost, mm_total_cost = llm.do_multimodal_completion(
         "What's in this image?", image_path
     )
-    print(f"Multimodal response: {multimodal_response['choices'][0]['message']['content']}")
+    print(
+        f"Multimodal response: {multimodal_response['choices'][0]['message']['content']}"
+    )
     print(f"Cost: ${mm_cost:.6f}, Total cost: ${mm_total_cost:.6f}")

@@ -11,6 +11,7 @@ from pydantic_core.core_schema import ValidationInfo
 from app.tool.base import BaseTool, ToolResult

+
 MAX_LENGTH = 2000

 _BROWSER_DESCRIPTION = """
@@ -181,7 +182,9 @@ class BrowserUseTool(BaseTool):
             elif action == "get_html":
                 html = await context.get_page_html()
-                truncated = html[:MAX_LENGTH] + "..." if len(html) > MAX_LENGTH else html
+                truncated = (
+                    html[:MAX_LENGTH] + "..." if len(html) > MAX_LENGTH else html
+                )
                 return ToolResult(output=truncated)

             elif action == "get_text":
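The wrapped expression caps `get_html` output at `MAX_LENGTH` characters and marks the cut with an ellipsis, keeping huge pages from flooding the model's context. The same guard as a tiny helper:

```python
MAX_LENGTH = 2000


def truncate(text: str, limit: int = MAX_LENGTH) -> str:
    """Cap tool output, appending '...' only when something was cut."""
    return text[:limit] + "..." if len(text) > limit else text


print(truncate("a" * 5, limit=3))  # aaa...
print(truncate("abc", limit=3))    # abc
```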