From afb049eb061e2c13fa369e1d87a76fb1a6874147 Mon Sep 17 00:00:00 2001 From: makosst <191634637+makosst@users.noreply.github.com> Date: Mon, 29 Sep 2025 23:23:23 -0700 Subject: [PATCH 1/4] Add Manta graph, add .claude to gitignore --- .gitignore | 3 + manta/base-graph.xml | 375 ++++++++++++++++++++++++++++++++++++++++ manta/current-graph.xml | 375 ++++++++++++++++++++++++++++++++++++++++ 3 files changed, 753 insertions(+) create mode 100644 manta/base-graph.xml create mode 100644 manta/current-graph.xml diff --git a/.gitignore b/.gitignore index a7bd963..45f52fe 100644 --- a/.gitignore +++ b/.gitignore @@ -126,6 +126,9 @@ dist # Stores VSCode versions used for testing VSCode extensions .vscode-test +# Claude sub-agents and settings +.claude/ + # yarn v2 .yarn/cache .yarn/unplugged diff --git a/manta/base-graph.xml b/manta/base-graph.xml new file mode 100644 index 0000000..812879d --- /dev/null +++ b/manta/base-graph.xml @@ -0,0 +1,375 @@ + + + + + The central orchestration engine for HyperAgent that manages task execution, LLM interactions, and action coordination. This system handles the main agent lifecycle including task planning, step execution, and state management. + + src/agent/index.ts + src/agent/tools/agent.ts + src/agent/tools/types.ts + src/agent/error.ts + src/agent/llms/structured-output.ts + + + + OpenAI + + + + + + + 128000 + false + + 0 + 0 + + + 0 + + + + + + + + + + + + + + The browser control and interaction layer that provides abstracted access to different browser providers (Local Playwright and Hyperbrowser cloud). This layer manages browser sessions, page navigation, and browser-specific operations. + + src/browser-providers/index.ts + src/browser-providers/local.ts + src/browser-providers/hyperbrowser.ts + src/types/browser-providers/types.ts + + + + Local + + + + + + + false + 0 + 0 + + + + + + + + + + + + + + 0 + false + + + + + + The data extraction and context gathering system that analyzes web pages to extract meaningful information for the agent. This includes DOM analysis, interactive element detection, screenshot processing, and content conversion to markdown. + + src/context-providers/dom/index.ts + src/context-providers/dom/build-dom-view.ts + src/context-providers/dom/find-interactive-elements.ts + src/context-providers/dom/highlight.ts + src/context-providers/dom/inject/build-dom-view.ts + src/context-providers/dom/types.ts + src/utils/html-to-markdown.ts + + + + 0 + 0 + + + false + false + + + false + false + + + false + + + + + + + The action execution system that provides a comprehensive set of browser automation actions including clicking, typing, navigation, and data extraction. This system handles action validation, execution, and result formatting for agent operations. + + src/agent/actions/index.ts + src/agent/actions/click-element.ts + src/agent/actions/input-text.ts + src/agent/actions/go-to-url.ts + src/agent/actions/scroll.ts + src/agent/actions/extract.ts + src/agent/actions/complete.ts + src/agent/actions/key-press.ts + src/agent/actions/select-option.ts + src/agent/actions/pdf.ts + src/agent/actions/utils.ts + src/types/agent/actions/types.ts + + + + + click-element + true + + + input-text + true + + + go-to-url + true + + + scroll + true + + + extract + true + + + 30000 + + 0 + 0 + + + false + false + + + + + + The command-line interface that provides user interaction capabilities for HyperAgent. This system handles user input, task management controls, progress visualization, and interactive prompts for a seamless terminal-based experience. + + src/cli/index.ts + + + + interactive + + + + + + + + false + false + false + + + + + + + + false + false + + + + + + The Model Context Protocol (MCP) integration system that enables HyperAgent to connect with external tools and services. This layer manages MCP server connections, tool registration, and provides extensible capabilities through protocol-based integrations. + + src/agent/mcp/client.ts + src/types/config.ts + + + + + + stdio + + + + + + true + + + + sse + + + + + + true + + + + 0 + 0 + + + false + false + + + false + 0 + + + + + + The extensible custom actions framework that allows users to define and register custom automation behaviors. This system provides user interaction capabilities and serves as a foundation for extending HyperAgent's functionality beyond built-in actions. + + src/custom-actions/index.ts + src/custom-actions/user-interaction.ts + + + + false + false + false + false + + + false + false + 0 + + + false + 0 + + + false + false + + + + + + The supporting infrastructure and utility components that provide foundational services across HyperAgent. This includes error handling, retry mechanisms, HTML processing, type definitions, and other shared utilities that enable the core functionality. + + src/utils/index.ts + src/utils/error-emitter.ts + src/utils/retry.ts + src/utils/sleep.ts + src/utils/html-to-markdown.ts + src/types/index.ts + src/types/agent/types.ts + src/types/config.ts + + + + false + false + false + + + 0 + false + 0 + + + false + false + false + + + false + false + + + + + + The examples and documentation system that provides usage patterns, integration samples, and implementation guides for HyperAgent. This includes examples for different LLM providers, browser configurations, MCP integrations, and custom tool implementations. + + examples/llms/anthropic.ts + examples/llms/openai.ts + examples/browser-providers/hyperbrowser.ts + examples/mcp/google-sheets/best-buy-reviews.ts + examples/mcp/google-sheets/car-price-comparison.ts + examples/mcp/notion/create-shopping-list.ts + examples/custom-tool/search/exa.ts + examples/simple/add-to-amazon-cart.ts + examples/output-to-schema/output-to-schema.ts + + + + + LLM Providers + 2 + + + Browser Providers + 1 + + + MCP Integrations + 5 + + + Custom Tools + 2 + + + Simple Tasks + 1 + + + + false + false + false + + + false + false + false + + + false + false + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/manta/current-graph.xml b/manta/current-graph.xml new file mode 100644 index 0000000..812879d --- /dev/null +++ b/manta/current-graph.xml @@ -0,0 +1,375 @@ + + + + + The central orchestration engine for HyperAgent that manages task execution, LLM interactions, and action coordination. This system handles the main agent lifecycle including task planning, step execution, and state management. + + src/agent/index.ts + src/agent/tools/agent.ts + src/agent/tools/types.ts + src/agent/error.ts + src/agent/llms/structured-output.ts + + + + OpenAI + + + + + + + 128000 + false + + 0 + 0 + + + 0 + + + + + + + + + + + + + + The browser control and interaction layer that provides abstracted access to different browser providers (Local Playwright and Hyperbrowser cloud). This layer manages browser sessions, page navigation, and browser-specific operations. + + src/browser-providers/index.ts + src/browser-providers/local.ts + src/browser-providers/hyperbrowser.ts + src/types/browser-providers/types.ts + + + + Local + + + + + + + false + 0 + 0 + + + + + + + + + + + + + + 0 + false + + + + + + The data extraction and context gathering system that analyzes web pages to extract meaningful information for the agent. This includes DOM analysis, interactive element detection, screenshot processing, and content conversion to markdown. + + src/context-providers/dom/index.ts + src/context-providers/dom/build-dom-view.ts + src/context-providers/dom/find-interactive-elements.ts + src/context-providers/dom/highlight.ts + src/context-providers/dom/inject/build-dom-view.ts + src/context-providers/dom/types.ts + src/utils/html-to-markdown.ts + + + + 0 + 0 + + + false + false + + + false + false + + + false + + + + + + + The action execution system that provides a comprehensive set of browser automation actions including clicking, typing, navigation, and data extraction. This system handles action validation, execution, and result formatting for agent operations. + + src/agent/actions/index.ts + src/agent/actions/click-element.ts + src/agent/actions/input-text.ts + src/agent/actions/go-to-url.ts + src/agent/actions/scroll.ts + src/agent/actions/extract.ts + src/agent/actions/complete.ts + src/agent/actions/key-press.ts + src/agent/actions/select-option.ts + src/agent/actions/pdf.ts + src/agent/actions/utils.ts + src/types/agent/actions/types.ts + + + + + click-element + true + + + input-text + true + + + go-to-url + true + + + scroll + true + + + extract + true + + + 30000 + + 0 + 0 + + + false + false + + + + + + The command-line interface that provides user interaction capabilities for HyperAgent. This system handles user input, task management controls, progress visualization, and interactive prompts for a seamless terminal-based experience. + + src/cli/index.ts + + + + interactive + + + + + + + + false + false + false + + + + + + + + false + false + + + + + + The Model Context Protocol (MCP) integration system that enables HyperAgent to connect with external tools and services. This layer manages MCP server connections, tool registration, and provides extensible capabilities through protocol-based integrations. + + src/agent/mcp/client.ts + src/types/config.ts + + + + + + stdio + + + + + + true + + + + sse + + + + + + true + + + + 0 + 0 + + + false + false + + + false + 0 + + + + + + The extensible custom actions framework that allows users to define and register custom automation behaviors. This system provides user interaction capabilities and serves as a foundation for extending HyperAgent's functionality beyond built-in actions. + + src/custom-actions/index.ts + src/custom-actions/user-interaction.ts + + + + false + false + false + false + + + false + false + 0 + + + false + 0 + + + false + false + + + + + + The supporting infrastructure and utility components that provide foundational services across HyperAgent. This includes error handling, retry mechanisms, HTML processing, type definitions, and other shared utilities that enable the core functionality. + + src/utils/index.ts + src/utils/error-emitter.ts + src/utils/retry.ts + src/utils/sleep.ts + src/utils/html-to-markdown.ts + src/types/index.ts + src/types/agent/types.ts + src/types/config.ts + + + + false + false + false + + + 0 + false + 0 + + + false + false + false + + + false + false + + + + + + The examples and documentation system that provides usage patterns, integration samples, and implementation guides for HyperAgent. This includes examples for different LLM providers, browser configurations, MCP integrations, and custom tool implementations. + + examples/llms/anthropic.ts + examples/llms/openai.ts + examples/browser-providers/hyperbrowser.ts + examples/mcp/google-sheets/best-buy-reviews.ts + examples/mcp/google-sheets/car-price-comparison.ts + examples/mcp/notion/create-shopping-list.ts + examples/custom-tool/search/exa.ts + examples/simple/add-to-amazon-cart.ts + examples/output-to-schema/output-to-schema.ts + + + + + LLM Providers + 2 + + + Browser Providers + 1 + + + MCP Integrations + 5 + + + Custom Tools + 2 + + + Simple Tasks + 1 + + + + false + false + false + + + false + false + false + + + false + false + + + + + + + + + + + + + + + + + + + + + + + + + From 923f8a6daf11e25d72a1852789a14c9860c4f029 Mon Sep 17 00:00:00 2001 From: Konstantin Marunchenko Date: Mon, 13 Oct 2025 00:16:21 -0700 Subject: [PATCH 2/4] Update .gitignore --- .gitignore | 3 --- 1 file changed, 3 deletions(-) diff --git a/.gitignore b/.gitignore index 45f52fe..a7bd963 100644 --- a/.gitignore +++ b/.gitignore @@ -126,9 +126,6 @@ dist # Stores VSCode versions used for testing VSCode extensions .vscode-test -# Claude sub-agents and settings -.claude/ - # yarn v2 .yarn/cache .yarn/unplugged From 53a13af55ff83ed667f20e7f493803f747170e03 Mon Sep 17 00:00:00 2001 From: Konstantin Marunchenko Date: Mon, 13 Oct 2025 00:17:08 -0700 Subject: [PATCH 3/4] Delete manta directory --- manta/base-graph.xml | 375 ---------------------------------------- manta/current-graph.xml | 375 ---------------------------------------- 2 files changed, 750 deletions(-) delete mode 100644 manta/base-graph.xml delete mode 100644 manta/current-graph.xml diff --git a/manta/base-graph.xml b/manta/base-graph.xml deleted file mode 100644 index 812879d..0000000 --- a/manta/base-graph.xml +++ /dev/null @@ -1,375 +0,0 @@ - - - - - The central orchestration engine for HyperAgent that manages task execution, LLM interactions, and action coordination. This system handles the main agent lifecycle including task planning, step execution, and state management. - - src/agent/index.ts - src/agent/tools/agent.ts - src/agent/tools/types.ts - src/agent/error.ts - src/agent/llms/structured-output.ts - - - - OpenAI - - - - - - - 128000 - false - - 0 - 0 - - - 0 - - - - - - - - - - - - - - The browser control and interaction layer that provides abstracted access to different browser providers (Local Playwright and Hyperbrowser cloud). This layer manages browser sessions, page navigation, and browser-specific operations. - - src/browser-providers/index.ts - src/browser-providers/local.ts - src/browser-providers/hyperbrowser.ts - src/types/browser-providers/types.ts - - - - Local - - - - - - - false - 0 - 0 - - - - - - - - - - - - - - 0 - false - - - - - - The data extraction and context gathering system that analyzes web pages to extract meaningful information for the agent. This includes DOM analysis, interactive element detection, screenshot processing, and content conversion to markdown. - - src/context-providers/dom/index.ts - src/context-providers/dom/build-dom-view.ts - src/context-providers/dom/find-interactive-elements.ts - src/context-providers/dom/highlight.ts - src/context-providers/dom/inject/build-dom-view.ts - src/context-providers/dom/types.ts - src/utils/html-to-markdown.ts - - - - 0 - 0 - - - false - false - - - false - false - - - false - - - - - - - The action execution system that provides a comprehensive set of browser automation actions including clicking, typing, navigation, and data extraction. This system handles action validation, execution, and result formatting for agent operations. - - src/agent/actions/index.ts - src/agent/actions/click-element.ts - src/agent/actions/input-text.ts - src/agent/actions/go-to-url.ts - src/agent/actions/scroll.ts - src/agent/actions/extract.ts - src/agent/actions/complete.ts - src/agent/actions/key-press.ts - src/agent/actions/select-option.ts - src/agent/actions/pdf.ts - src/agent/actions/utils.ts - src/types/agent/actions/types.ts - - - - - click-element - true - - - input-text - true - - - go-to-url - true - - - scroll - true - - - extract - true - - - 30000 - - 0 - 0 - - - false - false - - - - - - The command-line interface that provides user interaction capabilities for HyperAgent. This system handles user input, task management controls, progress visualization, and interactive prompts for a seamless terminal-based experience. - - src/cli/index.ts - - - - interactive - - - - - - - - false - false - false - - - - - - - - false - false - - - - - - The Model Context Protocol (MCP) integration system that enables HyperAgent to connect with external tools and services. This layer manages MCP server connections, tool registration, and provides extensible capabilities through protocol-based integrations. - - src/agent/mcp/client.ts - src/types/config.ts - - - - - - stdio - - - - - - true - - - - sse - - - - - - true - - - - 0 - 0 - - - false - false - - - false - 0 - - - - - - The extensible custom actions framework that allows users to define and register custom automation behaviors. This system provides user interaction capabilities and serves as a foundation for extending HyperAgent's functionality beyond built-in actions. - - src/custom-actions/index.ts - src/custom-actions/user-interaction.ts - - - - false - false - false - false - - - false - false - 0 - - - false - 0 - - - false - false - - - - - - The supporting infrastructure and utility components that provide foundational services across HyperAgent. This includes error handling, retry mechanisms, HTML processing, type definitions, and other shared utilities that enable the core functionality. - - src/utils/index.ts - src/utils/error-emitter.ts - src/utils/retry.ts - src/utils/sleep.ts - src/utils/html-to-markdown.ts - src/types/index.ts - src/types/agent/types.ts - src/types/config.ts - - - - false - false - false - - - 0 - false - 0 - - - false - false - false - - - false - false - - - - - - The examples and documentation system that provides usage patterns, integration samples, and implementation guides for HyperAgent. This includes examples for different LLM providers, browser configurations, MCP integrations, and custom tool implementations. - - examples/llms/anthropic.ts - examples/llms/openai.ts - examples/browser-providers/hyperbrowser.ts - examples/mcp/google-sheets/best-buy-reviews.ts - examples/mcp/google-sheets/car-price-comparison.ts - examples/mcp/notion/create-shopping-list.ts - examples/custom-tool/search/exa.ts - examples/simple/add-to-amazon-cart.ts - examples/output-to-schema/output-to-schema.ts - - - - - LLM Providers - 2 - - - Browser Providers - 1 - - - MCP Integrations - 5 - - - Custom Tools - 2 - - - Simple Tasks - 1 - - - - false - false - false - - - false - false - false - - - false - false - - - - - - - - - - - - - - - - - - - - - - - - - diff --git a/manta/current-graph.xml b/manta/current-graph.xml deleted file mode 100644 index 812879d..0000000 --- a/manta/current-graph.xml +++ /dev/null @@ -1,375 +0,0 @@ - - - - - The central orchestration engine for HyperAgent that manages task execution, LLM interactions, and action coordination. This system handles the main agent lifecycle including task planning, step execution, and state management. - - src/agent/index.ts - src/agent/tools/agent.ts - src/agent/tools/types.ts - src/agent/error.ts - src/agent/llms/structured-output.ts - - - - OpenAI - - - - - - - 128000 - false - - 0 - 0 - - - 0 - - - - - - - - - - - - - - The browser control and interaction layer that provides abstracted access to different browser providers (Local Playwright and Hyperbrowser cloud). This layer manages browser sessions, page navigation, and browser-specific operations. - - src/browser-providers/index.ts - src/browser-providers/local.ts - src/browser-providers/hyperbrowser.ts - src/types/browser-providers/types.ts - - - - Local - - - - - - - false - 0 - 0 - - - - - - - - - - - - - - 0 - false - - - - - - The data extraction and context gathering system that analyzes web pages to extract meaningful information for the agent. This includes DOM analysis, interactive element detection, screenshot processing, and content conversion to markdown. - - src/context-providers/dom/index.ts - src/context-providers/dom/build-dom-view.ts - src/context-providers/dom/find-interactive-elements.ts - src/context-providers/dom/highlight.ts - src/context-providers/dom/inject/build-dom-view.ts - src/context-providers/dom/types.ts - src/utils/html-to-markdown.ts - - - - 0 - 0 - - - false - false - - - false - false - - - false - - - - - - - The action execution system that provides a comprehensive set of browser automation actions including clicking, typing, navigation, and data extraction. This system handles action validation, execution, and result formatting for agent operations. - - src/agent/actions/index.ts - src/agent/actions/click-element.ts - src/agent/actions/input-text.ts - src/agent/actions/go-to-url.ts - src/agent/actions/scroll.ts - src/agent/actions/extract.ts - src/agent/actions/complete.ts - src/agent/actions/key-press.ts - src/agent/actions/select-option.ts - src/agent/actions/pdf.ts - src/agent/actions/utils.ts - src/types/agent/actions/types.ts - - - - - click-element - true - - - input-text - true - - - go-to-url - true - - - scroll - true - - - extract - true - - - 30000 - - 0 - 0 - - - false - false - - - - - - The command-line interface that provides user interaction capabilities for HyperAgent. This system handles user input, task management controls, progress visualization, and interactive prompts for a seamless terminal-based experience. - - src/cli/index.ts - - - - interactive - - - - - - - - false - false - false - - - - - - - - false - false - - - - - - The Model Context Protocol (MCP) integration system that enables HyperAgent to connect with external tools and services. This layer manages MCP server connections, tool registration, and provides extensible capabilities through protocol-based integrations. - - src/agent/mcp/client.ts - src/types/config.ts - - - - - - stdio - - - - - - true - - - - sse - - - - - - true - - - - 0 - 0 - - - false - false - - - false - 0 - - - - - - The extensible custom actions framework that allows users to define and register custom automation behaviors. This system provides user interaction capabilities and serves as a foundation for extending HyperAgent's functionality beyond built-in actions. - - src/custom-actions/index.ts - src/custom-actions/user-interaction.ts - - - - false - false - false - false - - - false - false - 0 - - - false - 0 - - - false - false - - - - - - The supporting infrastructure and utility components that provide foundational services across HyperAgent. This includes error handling, retry mechanisms, HTML processing, type definitions, and other shared utilities that enable the core functionality. - - src/utils/index.ts - src/utils/error-emitter.ts - src/utils/retry.ts - src/utils/sleep.ts - src/utils/html-to-markdown.ts - src/types/index.ts - src/types/agent/types.ts - src/types/config.ts - - - - false - false - false - - - 0 - false - 0 - - - false - false - false - - - false - false - - - - - - The examples and documentation system that provides usage patterns, integration samples, and implementation guides for HyperAgent. This includes examples for different LLM providers, browser configurations, MCP integrations, and custom tool implementations. - - examples/llms/anthropic.ts - examples/llms/openai.ts - examples/browser-providers/hyperbrowser.ts - examples/mcp/google-sheets/best-buy-reviews.ts - examples/mcp/google-sheets/car-price-comparison.ts - examples/mcp/notion/create-shopping-list.ts - examples/custom-tool/search/exa.ts - examples/simple/add-to-amazon-cart.ts - examples/output-to-schema/output-to-schema.ts - - - - - LLM Providers - 2 - - - Browser Providers - 1 - - - MCP Integrations - 5 - - - Custom Tools - 2 - - - Simple Tasks - 1 - - - - false - false - false - - - false - false - false - - - false - false - - - - - - - - - - - - - - - - - - - - - - - - - From 2ae9ac1f75b65225923c69354489832802a03eea Mon Sep 17 00:00:00 2001 From: Konstantin Marunchenko Date: Mon, 13 Oct 2025 00:21:44 -0700 Subject: [PATCH 4/4] Update README.md --- README.md | 3 +++ 1 file changed, 3 insertions(+) diff --git a/README.md b/README.md index 463e364..4e550fc 100644 --- a/README.md +++ b/README.md @@ -12,6 +12,9 @@ license + + HyperAgent graph on Manta + Discord